From 40be71066c57f116e5a0a5a3329ba521ef5ce0f8 Mon Sep 17 00:00:00 2001
From: Doua Vue <dvue@newrelic.com>
Date: Tue, 17 Sep 2024 12:22:41 -0500
Subject: [PATCH 01/10] feat: Add new quickstart and alert policies for k8s
 otel

---
 .../ContainerCPUThrottling.yaml               | 76 ++++++++++++++++++
 .../ContainerHighCPUUtil.yaml                 | 76 ++++++++++++++++++
 .../ContainerHighMemUtil.yaml                 | 76 ++++++++++++++++++
 .../ContainerRestarting.yaml                  | 73 ++++++++++++++++++
 .../ContainerWaiting.yaml                     | 73 ++++++++++++++++++
 .../DaemonsetPodsMissing.yaml                 | 73 ++++++++++++++++++
 .../DeploymentPodsMissing.yaml                | 73 ++++++++++++++++++
 .../JobFailedOtel.yaml                        | 77 +++++++++++++++++++
 .../NodeHighAllocatableCPUUtil.yaml           | 76 ++++++++++++++++++
 .../NodeHighAllocatableMemUtil.yaml           | 76 ++++++++++++++++++
 .../NodeHighFSCapacityUtil.yaml               | 76 ++++++++++++++++++
 .../NodeIsNotReady.yaml                       | 77 +++++++++++++++++++
 .../NodePodCapacity.yaml                      | 77 +++++++++++++++++++
 .../PersistentVolumeErrors.yaml               | 73 ++++++++++++++++++
 .../kubernetes-opentelemetry/PodNotReady.yaml | 77 +++++++++++++++++++
 .../PodNotScheduled.yaml                      | 76 ++++++++++++++++++
 .../PodsFailingNamespace.yaml                 | 73 ++++++++++++++++++
 .../StatefulsetPodsMissing.yaml               | 73 ++++++++++++++++++
 .../kubernetes-opentelemetry/config.yml       | 54 +++++++++++++
 quickstarts/kubernetes-opentelemetry/logo.svg |  1 +
 20 files changed, 1406 insertions(+)
 create mode 100644 alert-policies/kubernetes-opentelemetry/ContainerCPUThrottling.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/ContainerHighCPUUtil.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/ContainerHighMemUtil.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/ContainerRestarting.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/ContainerWaiting.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/DaemonsetPodsMissing.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/DeploymentPodsMissing.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/JobFailedOtel.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/NodeHighAllocatableCPUUtil.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/NodeHighAllocatableMemUtil.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/NodeHighFSCapacityUtil.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/NodeIsNotReady.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/NodePodCapacity.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/PersistentVolumeErrors.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/PodNotReady.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/PodNotScheduled.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/PodsFailingNamespace.yaml
 create mode 100644 alert-policies/kubernetes-opentelemetry/StatefulsetPodsMissing.yaml
 create mode 100644 quickstarts/kubernetes-opentelemetry/config.yml
 create mode 100644 quickstarts/kubernetes-opentelemetry/logo.svg

diff --git a/alert-policies/kubernetes-opentelemetry/ContainerCPUThrottling.yaml b/alert-policies/kubernetes-opentelemetry/ContainerCPUThrottling.yaml
new file mode 100644
index 0000000000..896c786d39
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/ContainerCPUThrottling.yaml
@@ -0,0 +1,76 @@
+name: Container cpu throttling is high
+# Human-readable summary of what this condition detects
+description: |
+  Alert when container is being throttled > 25% of the time for more than 5 minutes
+
+# Condition type: BASELINE | STATIC
+type: STATIC
+
+# NRQL query: throttled CFS periods as a percentage of all CFS periods
+nrql:
+  query: "from Metric select latest(container_cpu_cfs_throttled_periods_total) / latest(container_cpu_cfs_periods_total)* 100 where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') facet k8s.container.name, k8s.pod.name, k8s.namespace.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out because this condition is STATIC
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# How the NRQL query value(s) are aggregated before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison applied between the query value and the threshold
+    operator: ABOVE
+    # Percent of periods throttled that triggers a violation (25, as stated in the description)
+    threshold: 25
+    # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Whether ALL data points in the duration must be in violation, or AT_LEAST_ONCE
+    thresholdOccurrences: ALL
+
+  # Optional: uncomment to add a Warning threshold
+  # - priority: WARNING
+  #   # Operator used to compare against the threshold.
+  #   operator: ABOVE
+  #   # Value that triggers a violation
+  #   threshold: 0
+  #   # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+  #   thresholdDuration: 60
+  #   # How many data points must be in violation for the duration
+  #   thresholdOccurrences: AT_LEAST_ONCE
+
+# Loss of Signal settings
+expiration:
+  # When the signal is lost, close open violations (Default: false)
+  closeViolationsOnExpiration: true
+  # When the signal is lost, open a "Loss of Signal" violation (Default: false)
+  openViolationOnExpiration: false
+  # Time in seconds; max 172800 (48hrs). Use null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced Signal settings
+# Control how data is windowed and evaluated for the NRQL condition
+signal:
+  # Wait time for data that belongs in each aggregation window
+  aggregationDelay: 60  # seconds
+  # Method that decides when an aggregation window is complete and its signals can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Wait time after each data point arrives, to make sure the whole batch is processed
+  aggregationTimer: null  # seconds
+  # Duration of the time window used to evaluate the NRQL query
+  aggregationWindow: 300  # seconds; 30 seconds <= x < 15 minutes
+  # Type of value used to fill gaps (empty windows)
+  fillOption: NONE  # defaults to STATIC
+  # Value used for filling when the static fill option is selected
+  fillValue: null  # default
+  # Gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: 60  # seconds
+  # How long to wait before evaluating a signal against the thresholds in this condition
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/ContainerHighCPUUtil.yaml b/alert-policies/kubernetes-opentelemetry/ContainerHighCPUUtil.yaml
new file mode 100644
index 0000000000..625670c141
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/ContainerHighCPUUtil.yaml
@@ -0,0 +1,76 @@
+name: Container high cpu utilization
+# Human-readable summary of what this condition detects
+description: |
+  Alert when the average container cpu utilization (vs. Limit) is > 90% for more than 5 minutes
+
+# Condition type: BASELINE | STATIC
+type: STATIC
+
+# NRQL query: average container.cpu.utilization per container
+nrql:
+  query: "from Metric select average(container.cpu.utilization) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') facet k8s.container.name, k8s.pod.name, k8s.namespace.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out because this condition is STATIC
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# How the NRQL query value(s) are aggregated before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison applied between the query value and the threshold
+    operator: ABOVE
+    # Threshold value; exceeding it triggers a violation
+    threshold: 90
+    # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Whether ALL data points in the duration must be in violation, or AT_LEAST_ONCE
+    thresholdOccurrences: ALL
+
+  # Optional: uncomment to add a Warning threshold
+  # - priority: WARNING
+  #   # Operator used to compare against the threshold.
+  #   operator: ABOVE
+  #   # Value that triggers a violation
+  #   threshold: 0
+  #   # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+  #   thresholdDuration: 60
+  #   # How many data points must be in violation for the duration
+  #   thresholdOccurrences: AT_LEAST_ONCE
+
+# Loss of Signal settings
+expiration:
+  # When the signal is lost, close open violations (Default: false)
+  closeViolationsOnExpiration: true
+  # When the signal is lost, open a "Loss of Signal" violation (Default: false)
+  openViolationOnExpiration: false
+  # Time in seconds; max 172800 (48hrs). Use null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced Signal settings
+# Control how data is windowed and evaluated for the NRQL condition
+signal:
+  # Wait time for data that belongs in each aggregation window
+  aggregationDelay: 60  # seconds
+  # Method that decides when an aggregation window is complete and its signals can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Wait time after each data point arrives, to make sure the whole batch is processed
+  aggregationTimer: null  # seconds
+  # Duration of the time window used to evaluate the NRQL query
+  aggregationWindow: 300  # seconds; 30 seconds <= x < 15 minutes
+  # Type of value used to fill gaps (empty windows)
+  fillOption: NONE  # defaults to STATIC
+  # Value used for filling when the static fill option is selected
+  fillValue: null  # default
+  # Gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: 60  # seconds
+  # How long to wait before evaluating a signal against the thresholds in this condition
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/ContainerHighMemUtil.yaml b/alert-policies/kubernetes-opentelemetry/ContainerHighMemUtil.yaml
new file mode 100644
index 0000000000..fe3db565c0
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/ContainerHighMemUtil.yaml
@@ -0,0 +1,76 @@
+name: Container high memory utilization
+# Human-readable summary of what this condition detects
+description: |
+  Alert when the average container memory utilization (vs. Limit) is > 90% for more than 5 minutes
+
+# Condition type: BASELINE | STATIC
+type: STATIC
+
+# NRQL query: working-set bytes as a percentage of the memory limit (x 100 so it is comparable to threshold 90)
+nrql:
+  query: "from Metric select max(container_memory_working_set_bytes) / filter(max(kube_pod_container_resource_limits), where resource = 'memory') * 100 where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') facet k8s.container.name, k8s.pod.name, k8s.namespace.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out because this condition is STATIC
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# How the NRQL query value(s) are aggregated before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison applied between the query value and the threshold
+    operator: ABOVE
+    # Percent of the memory limit that triggers a violation
+    threshold: 90
+    # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Whether ALL data points in the duration must be in violation, or AT_LEAST_ONCE
+    thresholdOccurrences: ALL
+
+  # Optional: uncomment to add a Warning threshold
+  # - priority: WARNING
+  #   # Operator used to compare against the threshold.
+  #   operator: ABOVE
+  #   # Value that triggers a violation
+  #   threshold: 0
+  #   # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+  #   thresholdDuration: 60
+  #   # How many data points must be in violation for the duration
+  #   thresholdOccurrences: AT_LEAST_ONCE
+
+# Loss of Signal settings
+expiration:
+  # When the signal is lost, close open violations (Default: false)
+  closeViolationsOnExpiration: true
+  # When the signal is lost, open a "Loss of Signal" violation (Default: false)
+  openViolationOnExpiration: false
+  # Time in seconds; max 172800 (48hrs). Use null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced Signal settings
+# Control how data is windowed and evaluated for the NRQL condition
+signal:
+  # Wait time for data that belongs in each aggregation window
+  aggregationDelay: 60  # seconds
+  # Method that decides when an aggregation window is complete and its signals can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Wait time after each data point arrives, to make sure the whole batch is processed
+  aggregationTimer: null  # seconds
+  # Duration of the time window used to evaluate the NRQL query
+  aggregationWindow: 300  # seconds; 30 seconds <= x < 15 minutes
+  # Type of value used to fill gaps (empty windows)
+  fillOption: NONE  # defaults to STATIC
+  # Value used for filling when the static fill option is selected
+  fillValue: null  # default
+  # Gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: 60  # seconds
+  # How long to wait before evaluating a signal against the thresholds in this condition
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/ContainerRestarting.yaml b/alert-policies/kubernetes-opentelemetry/ContainerRestarting.yaml
new file mode 100644
index 0000000000..9df6519ebd
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/ContainerRestarting.yaml
@@ -0,0 +1,73 @@
+name: Container is Restarting
+
+# Human-readable summary of what this condition detects
+description: |
+  Alert when the container restart count is greater than 0 in a sliding 5 minute window
+
+# Condition type: BASELINE | STATIC
+type: STATIC
+
+# NRQL query: sum of kube_pod_container_status_restarts_total per container
+nrql:
+  query: "from Metric select sum(kube_pod_container_status_restarts_total) where metricName = 'kube_pod_container_status_restarts_total' and k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') FACET k8s.container.name, k8s.pod.name, k8s.namespace.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out because this condition is STATIC
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# How the NRQL query value(s) are aggregated before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison applied between the query value and the threshold
+    operator: ABOVE
+    # Threshold value; exceeding it triggers a violation
+    threshold: 0
+    # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Whether ALL data points in the duration must be in violation, or AT_LEAST_ONCE
+    thresholdOccurrences: ALL
+
+  # Optional: uncomment to add a Warning threshold
+  # - priority: WARNING
+  #   operator: ABOVE
+  #   threshold: 1
+  #   thresholdDuration: 300
+  #   thresholdOccurrences: ALL | AT_LEAST_ONCE
+
+# Loss of Signal settings
+expiration:
+  # When the signal is lost, close open violations (Default: false)
+  closeViolationsOnExpiration: true
+  # When the signal is lost, open a "Loss of Signal" violation (Default: false)
+  openViolationOnExpiration: false
+  # Time in seconds; max 172800 (48hrs). Use null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced Signal settings
+# Control how data is windowed and evaluated for the NRQL condition
+signal:
+  # Wait time for data that belongs in each aggregation window
+  aggregationDelay: 60  # seconds
+  # Method that decides when an aggregation window is complete and its signals can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Wait time after each data point arrives, to make sure the whole batch is processed
+  aggregationTimer: null  # seconds
+  # Duration of the time window used to evaluate the NRQL query
+  aggregationWindow: 300  # seconds; 30 seconds <= x < 15 minutes
+  # Type of value used to fill gaps (empty windows)
+  fillOption: NONE  # defaults to STATIC
+  # Value used for filling when the static fill option is selected
+  fillValue: null  # default
+  # Gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: 60  # seconds
+  # How long to wait before evaluating a signal against the thresholds in this condition
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/ContainerWaiting.yaml b/alert-policies/kubernetes-opentelemetry/ContainerWaiting.yaml
new file mode 100644
index 0000000000..d47e2bc813
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/ContainerWaiting.yaml
@@ -0,0 +1,73 @@
+name: Container is Waiting
+
+# Human-readable summary of what this condition detects
+description: |
+  Alert when a container is Waiting for more than 5 minutes
+
+# Condition type: BASELINE | STATIC
+type: STATIC
+
+# NRQL query: unique pod names reporting container_phase = 'waiting'
+nrql:
+  query: "from Metric select uniqueCount(k8s.pod.name) WHERE container_phase = 'waiting' and k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') FACET k8s.container.name, k8s.pod.name, k8s.namespace.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out because this condition is STATIC
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# How the NRQL query value(s) are aggregated before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison applied between the query value and the threshold
+    operator: ABOVE
+    # Threshold value; exceeding it triggers a violation
+    threshold: 0
+    # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Whether ALL data points in the duration must be in violation, or AT_LEAST_ONCE
+    thresholdOccurrences: ALL
+
+  # Optional: uncomment to add a Warning threshold
+  # - priority: WARNING
+  #   operator: ABOVE
+  #   threshold: 1
+  #   thresholdDuration: 300
+  #   thresholdOccurrences: ALL | AT_LEAST_ONCE
+
+# Loss of Signal settings
+expiration:
+  # When the signal is lost, close open violations (Default: false)
+  closeViolationsOnExpiration: true
+  # When the signal is lost, open a "Loss of Signal" violation (Default: false)
+  openViolationOnExpiration: false
+  # Time in seconds; max 172800 (48hrs). Use null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced Signal settings
+# Control how data is windowed and evaluated for the NRQL condition
+signal:
+  # Wait time for data that belongs in each aggregation window
+  aggregationDelay: 60  # seconds
+  # Method that decides when an aggregation window is complete and its signals can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Wait time after each data point arrives, to make sure the whole batch is processed
+  aggregationTimer: null  # seconds
+  # Duration of the time window used to evaluate the NRQL query
+  aggregationWindow: 60  # seconds; 30 seconds <= x < 15 minutes
+  # Type of value used to fill gaps (empty windows)
+  fillOption: NONE  # defaults to STATIC
+  # Value used for filling when the static fill option is selected
+  fillValue: null  # default
+  # Gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: null  # seconds
+  # How long to wait before evaluating a signal against the thresholds in this condition
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/DaemonsetPodsMissing.yaml b/alert-policies/kubernetes-opentelemetry/DaemonsetPodsMissing.yaml
new file mode 100644
index 0000000000..3dd5ae52f3
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/DaemonsetPodsMissing.yaml
@@ -0,0 +1,73 @@
+name: Daemonset is missing Pods
+
+# Human-readable summary of what this condition detects
+description: |
+  Alert when Daemonset is missing Pods for > 5 minutes
+
+# Condition type: BASELINE | STATIC
+type: STATIC
+
+# NRQL query: desired scheduled count minus ready count, per daemonset
+nrql:
+  query: "from Metric select latest(kube_daemonset_status_desired_number_scheduled) - latest(kube_daemonset_status_number_ready) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') facet k8s.daemonset.name, k8s.namespace.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out because this condition is STATIC
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# How the NRQL query value(s) are aggregated before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison applied between the query value and the threshold
+    operator: ABOVE
+    # Threshold value; exceeding it triggers a violation
+    threshold: 0
+    # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Whether ALL data points in the duration must be in violation, or AT_LEAST_ONCE
+    thresholdOccurrences: ALL
+
+  # Optional: uncomment to add a Warning threshold
+  # - priority: WARNING
+  #   operator: ABOVE
+  #   threshold: 1
+  #   thresholdDuration: 300
+  #   thresholdOccurrences: ALL | AT_LEAST_ONCE
+
+# Loss of Signal settings
+expiration:
+  # When the signal is lost, close open violations (Default: false)
+  closeViolationsOnExpiration: true
+  # When the signal is lost, open a "Loss of Signal" violation (Default: false)
+  openViolationOnExpiration: false
+  # Time in seconds; max 172800 (48hrs). Use null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced Signal settings
+# Control how data is windowed and evaluated for the NRQL condition
+signal:
+  # Wait time for data that belongs in each aggregation window
+  aggregationDelay: 60  # seconds
+  # Method that decides when an aggregation window is complete and its signals can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Wait time after each data point arrives, to make sure the whole batch is processed
+  aggregationTimer: null  # seconds
+  # Duration of the time window used to evaluate the NRQL query
+  aggregationWindow: 60  # seconds; 30 seconds <= x < 15 minutes
+  # Type of value used to fill gaps (empty windows)
+  fillOption: NONE  # defaults to STATIC
+  # Value used for filling when the static fill option is selected
+  fillValue: null  # default
+  # Gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: null  # seconds
+  # How long to wait before evaluating a signal against the thresholds in this condition
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/DeploymentPodsMissing.yaml b/alert-policies/kubernetes-opentelemetry/DeploymentPodsMissing.yaml
new file mode 100644
index 0000000000..0dc3e4f664
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/DeploymentPodsMissing.yaml
@@ -0,0 +1,73 @@
+name: Deployment is missing Pods
+
+# Human-readable summary of what this condition detects
+description: |
+  Alert when Deployment is missing Pods for > 5 minutes
+
+# Condition type: BASELINE | STATIC
+type: STATIC
+
+# NRQL query: spec replicas minus status replicas, per deployment
+nrql:
+  query: "from Metric select latest(kube_deployment_spec_replicas) - latest(kube_deployment_status_replicas) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') facet k8s.deployment.name, k8s.namespace.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out because this condition is STATIC
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# How the NRQL query value(s) are aggregated before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison applied between the query value and the threshold
+    operator: ABOVE
+    # Threshold value; exceeding it triggers a violation
+    threshold: 0
+    # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Whether ALL data points in the duration must be in violation, or AT_LEAST_ONCE
+    thresholdOccurrences: ALL
+
+  # Optional: uncomment to add a Warning threshold
+  # - priority: WARNING
+  #   operator: ABOVE
+  #   threshold: 1
+  #   thresholdDuration: 300
+  #   thresholdOccurrences: ALL | AT_LEAST_ONCE
+
+# Loss of Signal settings
+expiration:
+  # When the signal is lost, close open violations (Default: false)
+  closeViolationsOnExpiration: true
+  # When the signal is lost, open a "Loss of Signal" violation (Default: false)
+  openViolationOnExpiration: false
+  # Time in seconds; max 172800 (48hrs). Use null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced Signal settings
+# Control how data is windowed and evaluated for the NRQL condition
+signal:
+  # Wait time for data that belongs in each aggregation window
+  aggregationDelay: 60  # seconds
+  # Method that decides when an aggregation window is complete and its signals can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Wait time after each data point arrives, to make sure the whole batch is processed
+  aggregationTimer: null  # seconds
+  # Duration of the time window used to evaluate the NRQL query
+  aggregationWindow: 60  # seconds; 30 seconds <= x < 15 minutes
+  # Type of value used to fill gaps (empty windows)
+  fillOption: NONE  # defaults to STATIC
+  # Value used for filling when the static fill option is selected
+  fillValue: null  # default
+  # Gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: null  # seconds
+  # How long to wait before evaluating a signal against the thresholds in this condition
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/JobFailedOtel.yaml b/alert-policies/kubernetes-opentelemetry/JobFailedOtel.yaml
new file mode 100644
index 0000000000..2b5c52374e
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/JobFailedOtel.yaml
@@ -0,0 +1,77 @@
+name: Job Failed
+
+# Human-readable summary of what this condition detects
+description: |
+  Alert when a Job reports a failed status
+
+# Condition type: BASELINE | STATIC
+type: STATIC
+
+# NRQL query: uniqueCount(job_name) when latest(kube_job_failed) is set, otherwise 0
+nrql:
+  query: "from Metric select if(latest(kube_job_failed), uniqueCount(job_name), 0) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') facet job_name, k8s.namespace.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out because this condition is STATIC
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# How the NRQL query value(s) are aggregated before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition (the Critical term is commented out)
+terms:
+  # - priority: CRITICAL
+  #   # Operator used to compare against the threshold.
+  #   operator: ABOVE
+  #   # Value that triggers a violation
+  #   threshold: 0
+  #   # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+  #   thresholdDuration: 300
+  #   # How many data points must be in violation for the duration
+  #   thresholdOccurrences: ALL
+
+  # Warning threshold: the only active term in this condition
+  - priority: WARNING
+    # Comparison applied between the query value and the threshold
+    operator: ABOVE
+    # Threshold value; exceeding it triggers a violation
+    threshold: 0
+    # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+    thresholdDuration: 60
+    # Whether ALL data points in the duration must be in violation, or AT_LEAST_ONCE
+    thresholdOccurrences: AT_LEAST_ONCE
+
+# Loss of Signal settings
+expiration:
+  # When the signal is lost, close open violations (Default: false)
+  closeViolationsOnExpiration: true
+  # When the signal is lost, open a "Loss of Signal" violation (Default: false)
+  openViolationOnExpiration: false
+  # Time in seconds; max 172800 (48hrs). Use null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced Signal settings
+# Control how data is windowed and evaluated for the NRQL condition
+signal:
+  # Wait time for data that belongs in each aggregation window
+  aggregationDelay: 60  # seconds
+  # Method that decides when an aggregation window is complete and its signals can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Wait time after each data point arrives, to make sure the whole batch is processed
+  aggregationTimer: null  # seconds
+  # Duration of the time window used to evaluate the NRQL query
+  aggregationWindow: 60  # seconds; 30 seconds <= x < 15 minutes
+  # Type of value used to fill gaps (empty windows)
+  fillOption: NONE  # defaults to STATIC
+  # Value used for filling when the static fill option is selected
+  fillValue: null  # default
+  # Gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: null  # seconds
+  # How long to wait before evaluating a signal against the thresholds in this condition
+  evaluationDelay: null
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableCPUUtil.yaml b/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableCPUUtil.yaml
new file mode 100644
index 0000000000..ecf61d4fe2
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableCPUUtil.yaml
@@ -0,0 +1,76 @@
+name: Node allocatable cpu utilization is high
+# Summary text describing what the condition detects
+description: |
+  Alert when the average Node allocatable cpu utilization is > 90% for more than 5 minutes
+
+# Condition type, one of: BASELINE | STATIC
+type: STATIC
+
+# NRQL signal, faceted per node and cluster. NOTE(review): the threshold assumes this metric is a 0-100 percentage - confirm
+nrql:
+  query: "from Metric select latest(k8s.node.cpu.utilization) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out for this condition
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# Aggregation applied to the NRQL query value(s) before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison made between the signal and the threshold
+    operator: ABOVE
+    # Value at which a violation is triggered
+    threshold: 90
+    # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Number of data points that must violate during the duration
+    thresholdOccurrences: ALL
+
+  # Optional Warning threshold; uncomment to enable
+  # - priority: WARNING
+  #   # Comparison made between the signal and the threshold
+  #   operator: ABOVE
+  #   # Value at which a violation is triggered
+  #   threshold: 0
+  #   # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+  #   thresholdDuration: 60
+  #   # Number of data points that must violate during the duration
+  #   thresholdOccurrences: AT_LEAST_ONCE
+
+# Loss of signal settings
+expiration:
+  # Whether open violations are closed when the signal is lost (Default: false)
+  closeViolationsOnExpiration: true
+  # Whether a "Loss of Signal" violation is opened when the signal is lost (Default: false)
+  openViolationOnExpiration: false
+  # Seconds; Max value: 172800 (48hrs); null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 900
+
+# Advanced signal settings
+# These control how data is windowed when the NRQL condition is evaluated
+signal:
+  # Seconds to wait for data that belongs in each aggregation window
+  aggregationDelay: 60
+  # Method that decides when an aggregation window is complete and can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Seconds to wait after each data point arrives so the whole batch is processed
+  aggregationTimer: null
+  # Length in seconds of the time window used to evaluate the NRQL query; 30 seconds <= x < 15 minutes
+  aggregationWindow: 300
+  # Type of value used to fill gaps (empty windows); defaults to STATIC
+  fillOption: NONE
+  # Fill value, used only with the static fill option; null is the default
+  fillValue: null
+  # Seconds; gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: 60
+  # How long to wait before a signal starts being evaluated against this condition's thresholds
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableMemUtil.yaml b/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableMemUtil.yaml
new file mode 100644
index 0000000000..da0e55aa99
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableMemUtil.yaml
@@ -0,0 +1,76 @@
+name: Node allocatable memory utilization is high
+# Summary text describing what the condition detects
+description: |
+  Alert when the average Node allocatable memory utilization is > 90% for more than 5 minutes
+
+# Condition type, one of: BASELINE | STATIC
+type: STATIC
+
+# NRQL signal: working-set memory divided by allocatable memory, scaled by 100 so it matches the percentage threshold below
+nrql:
+  query: "from Metric select latest(k8s.node.memory.working_set) / filter(latest(kube_node_status_allocatable), WHERE resource = 'memory') * 100 where k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out for this condition
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# Aggregation applied to the NRQL query value(s) before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison made between the signal and the threshold
+    operator: ABOVE
+    # Value (percent) at which a violation is triggered
+    threshold: 90
+    # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Number of data points that must violate during the duration
+    thresholdOccurrences: ALL
+
+  # Optional Warning threshold; uncomment to enable
+  # - priority: WARNING
+  #   # Comparison made between the signal and the threshold
+  #   operator: ABOVE
+  #   # Value at which a violation is triggered
+  #   threshold: 0
+  #   # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+  #   thresholdDuration: 60
+  #   # Number of data points that must violate during the duration
+  #   thresholdOccurrences: AT_LEAST_ONCE
+
+# Loss of signal settings
+expiration:
+  # Whether open violations are closed when the signal is lost (Default: false)
+  closeViolationsOnExpiration: true
+  # Whether a "Loss of Signal" violation is opened when the signal is lost (Default: false)
+  openViolationOnExpiration: false
+  # Seconds; Max value: 172800 (48hrs); null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 900
+
+# Advanced signal settings
+# These control how data is windowed when the NRQL condition is evaluated
+signal:
+  # Seconds to wait for data that belongs in each aggregation window
+  aggregationDelay: 60
+  # Method that decides when an aggregation window is complete and can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Seconds to wait after each data point arrives so the whole batch is processed
+  aggregationTimer: null
+  # Length in seconds of the time window used to evaluate the NRQL query; 30 seconds <= x < 15 minutes
+  aggregationWindow: 300
+  # Type of value used to fill gaps (empty windows); defaults to STATIC
+  fillOption: NONE
+  # Fill value, used only with the static fill option; null is the default
+  fillValue: null
+  # Seconds; gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: 60
+  # How long to wait before a signal starts being evaluated against this condition's thresholds
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/NodeHighFSCapacityUtil.yaml b/alert-policies/kubernetes-opentelemetry/NodeHighFSCapacityUtil.yaml
new file mode 100644
index 0000000000..a09b71d454
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/NodeHighFSCapacityUtil.yaml
@@ -0,0 +1,76 @@
+name: Node root file system capacity utilization is high
+# Summary text describing what the condition detects
+description: |
+  Alert when the average Node root file system capacity utilization is > 90% for more than 5 minutes
+
+# Condition type, one of: BASELINE | STATIC
+type: STATIC
+
+# NRQL signal: filesystem usage divided by filesystem capacity, scaled by 100 so it matches the percentage threshold below
+nrql:
+  query: "from Metric select max(k8s.node.filesystem.usage) / max(k8s.node.filesystem.capacity) * 100 where k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out for this condition
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# Aggregation applied to the NRQL query value(s) before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison made between the signal and the threshold
+    operator: ABOVE
+    # Value (percent) at which a violation is triggered
+    threshold: 90
+    # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Number of data points that must violate during the duration
+    thresholdOccurrences: ALL
+
+  # Optional Warning threshold; uncomment to enable
+  # - priority: WARNING
+  #   # Comparison made between the signal and the threshold
+  #   operator: ABOVE
+  #   # Value at which a violation is triggered
+  #   threshold: 0
+  #   # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+  #   thresholdDuration: 60
+  #   # Number of data points that must violate during the duration
+  #   thresholdOccurrences: AT_LEAST_ONCE
+
+# Loss of signal settings
+expiration:
+  # Whether open violations are closed when the signal is lost (Default: false)
+  closeViolationsOnExpiration: true
+  # Whether a "Loss of Signal" violation is opened when the signal is lost (Default: false)
+  openViolationOnExpiration: false
+  # Seconds; Max value: 172800 (48hrs); null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 900
+
+# Advanced signal settings
+# These control how data is windowed when the NRQL condition is evaluated
+signal:
+  # Seconds to wait for data that belongs in each aggregation window
+  aggregationDelay: 60
+  # Method that decides when an aggregation window is complete and can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Seconds to wait after each data point arrives so the whole batch is processed
+  aggregationTimer: null
+  # Length in seconds of the time window used to evaluate the NRQL query; 30 seconds <= x < 15 minutes
+  aggregationWindow: 300
+  # Type of value used to fill gaps (empty windows); defaults to STATIC
+  fillOption: NONE
+  # Fill value, used only with the static fill option; null is the default
+  fillValue: null
+  # Seconds; gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: 60
+  # How long to wait before a signal starts being evaluated against this condition's thresholds
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/NodeIsNotReady.yaml b/alert-policies/kubernetes-opentelemetry/NodeIsNotReady.yaml
new file mode 100644
index 0000000000..b46ee313d6
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/NodeIsNotReady.yaml
@@ -0,0 +1,77 @@
+name: Node is not ready
+
+# Summary text describing what the condition detects
+description: |
+  Alert when a Node is not ready for > 5 minutes
+
+# Condition type, one of: BASELINE | STATIC
+type: STATIC
+
+# NRQL signal: 1 when the node reports 'Ready', else 0. NOTE(review): assumes `condition` is 'Ready' only for ready nodes - confirm
+nrql:
+  query: "from Metric select if(latest(condition) = 'Ready', 1, 0) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out for this condition
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# Aggregation applied to the NRQL query value(s) before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison made between the signal and the threshold; BELOW 1 matches the not-ready value 0
+    operator: BELOW
+    # Value at which a violation is triggered
+    threshold: 1
+    # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Number of data points that must violate during the duration
+    thresholdOccurrences: ALL
+
+  # Optional Warning threshold; uncomment to enable
+  # - priority: WARNING
+  #   # Comparison made between the signal and the threshold
+  #   operator: ABOVE
+  #   # Value at which a violation is triggered
+  #   threshold: 0
+  #   # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+  #   thresholdDuration: 60
+  #   # Number of data points that must violate during the duration
+  #   thresholdOccurrences: AT_LEAST_ONCE
+
+# Loss of signal settings
+expiration:
+  # Whether open violations are closed when the signal is lost (Default: false)
+  closeViolationsOnExpiration: true
+  # Whether a "Loss of Signal" violation is opened when the signal is lost (Default: false)
+  openViolationOnExpiration: false
+  # Seconds; Max value: 172800 (48hrs); null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced signal settings
+# These control how data is windowed when the NRQL condition is evaluated
+signal:
+  # Seconds to wait for data that belongs in each aggregation window
+  aggregationDelay: 60
+  # Method that decides when an aggregation window is complete and can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Seconds to wait after each data point arrives so the whole batch is processed
+  aggregationTimer: null
+  # Length in seconds of the time window used to evaluate the NRQL query; 30 seconds <= x < 15 minutes
+  aggregationWindow: 60
+  # Type of value used to fill gaps (empty windows); defaults to STATIC
+  fillOption: NONE
+  # Fill value, used only with the static fill option; null is the default
+  fillValue: null
+  # Seconds; gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: null
+  # How long to wait before a signal starts being evaluated against this condition's thresholds
+  evaluationDelay: 300
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/NodePodCapacity.yaml b/alert-policies/kubernetes-opentelemetry/NodePodCapacity.yaml
new file mode 100644
index 0000000000..09c20296fd
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/NodePodCapacity.yaml
@@ -0,0 +1,77 @@
+name: Node Pod count nearing capacity
+
+# Summary text describing what the condition detects
+description: |
+  Alert when the Running pod count on a Node is > 90% of the Node's Pod Capacity for more than 5 minutes
+
+# Condition type, one of: BASELINE | STATIC
+type: STATIC
+
+# NRQL signal: count of Running non-Job pods divided by the node's allocatable 'pods' resource, as a percentage
+nrql:
+  query: "FROM Metric select filter(uniqueCount(k8s.pod.name), where phase = 'Running' AND (metricName = 'kube_pod_status_phase' AND kube_pod_status_phase ['latest'] = 1) and created_by_kind != 'Job' ) / filter(latest(kube_node_status_allocatable), WHERE resource = 'pods' ) * 100 as 'Pod Capacity %' where k8s.node.name != '' and k8s.node.name is not null and k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out for this condition
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# Aggregation applied to the NRQL query value(s) before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition; the Critical term is disabled here
+terms:
+  # - priority: CRITICAL
+  #   # Comparison made between the signal and the threshold
+  #   operator: ABOVE
+  #   # Value (percent) at which a violation is triggered
+  #   threshold: 90
+  #   # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+  #   thresholdDuration: 300
+  #   # Number of data points that must violate during the duration
+  #   thresholdOccurrences: ALL
+
+  # Warning threshold; the only active term for this condition
+  - priority: WARNING
+    # Comparison made between the signal and the threshold
+    operator: ABOVE
+    # Value (percent) at which a violation is triggered
+    threshold: 90
+    # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Number of data points that must violate during the duration
+    thresholdOccurrences: ALL
+
+# Loss of signal settings
+expiration:
+  # Whether open violations are closed when the signal is lost (Default: false)
+  closeViolationsOnExpiration: true
+  # Whether a "Loss of Signal" violation is opened when the signal is lost (Default: false)
+  openViolationOnExpiration: false
+  # Seconds; Max value: 172800 (48hrs); null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced signal settings
+# These control how data is windowed when the NRQL condition is evaluated
+signal:
+  # Seconds to wait for data that belongs in each aggregation window
+  aggregationDelay: 60
+  # Method that decides when an aggregation window is complete and can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Seconds to wait after each data point arrives so the whole batch is processed
+  aggregationTimer: null
+  # Length in seconds of the time window used to evaluate the NRQL query; 30 seconds <= x < 15 minutes
+  aggregationWindow: 60
+  # Type of value used to fill gaps (empty windows); defaults to STATIC
+  fillOption: NONE
+  # Fill value, used only with the static fill option; null is the default
+  fillValue: null
+  # Seconds; gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: null
+  # How long to wait before a signal starts being evaluated against this condition's thresholds
+  evaluationDelay: 300
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/PersistentVolumeErrors.yaml b/alert-policies/kubernetes-opentelemetry/PersistentVolumeErrors.yaml
new file mode 100644
index 0000000000..73fd69119f
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/PersistentVolumeErrors.yaml
@@ -0,0 +1,73 @@
+name: Persistent Volume has errors
+
+# Summary text describing what the condition detects
+description: |
+  Alert when Persistent Volume is in a Failed or Pending state for more than 5 minutes
+
+# Condition type, one of: BASELINE | STATIC
+type: STATIC
+
+# NRQL signal: volumes whose Failed/Pending phase series is 1. NOTE(review): assumes the phase metric reports 0/1 per phase - confirm
+nrql:
+  query: "from Metric select uniqueCount(persistentvolume) where metricName = 'kube_persistentvolume_status_phase' and kube_persistentvolume_status_phase ['latest'] = 1 and phase in ('Failed','Pending') and k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet persistentvolume, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out for this condition
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# Aggregation applied to the NRQL query value(s) before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison made between the signal and the threshold
+    operator: ABOVE
+    # Value at which a violation is triggered
+    threshold: 0
+    # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Number of data points that must violate during the duration
+    thresholdOccurrences: ALL
+
+  # Optional Warning threshold; uncomment to enable
+  # - priority: WARNING
+  #   operator: ABOVE
+  #   threshold: 1
+  #   thresholdDuration: 300
+  #   thresholdOccurrences: ALL | AT_LEAST_ONCE
+
+# Loss of signal settings
+expiration:
+  # Whether open violations are closed when the signal is lost (Default: false)
+  closeViolationsOnExpiration: true
+  # Whether a "Loss of Signal" violation is opened when the signal is lost (Default: false)
+  openViolationOnExpiration: false
+  # Seconds; Max value: 172800 (48hrs); null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced signal settings
+# These control how data is windowed when the NRQL condition is evaluated
+signal:
+  # Seconds to wait for data that belongs in each aggregation window
+  aggregationDelay: 60
+  # Method that decides when an aggregation window is complete and can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Seconds to wait after each data point arrives so the whole batch is processed
+  aggregationTimer: null
+  # Length in seconds of the time window used to evaluate the NRQL query; 30 seconds <= x < 15 minutes
+  aggregationWindow: 60
+  # Type of value used to fill gaps (empty windows); defaults to STATIC
+  fillOption: NONE
+  # Fill value, used only with the static fill option; null is the default
+  fillValue: null
+  # Seconds; gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: null
+  # How long to wait before a signal starts being evaluated against this condition's thresholds
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/PodNotReady.yaml b/alert-policies/kubernetes-opentelemetry/PodNotReady.yaml
new file mode 100644
index 0000000000..1418e1189e
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/PodNotReady.yaml
@@ -0,0 +1,77 @@
+name: Pod is not ready
+
+# Summary text describing what the condition detects
+description: |
+  Alert when a Pod is not ready for > 5 minutes
+
+# Condition type, one of: BASELINE | STATIC
+type: STATIC
+
+# NRQL signal per pod. NOTE(review): presumably 1 means ready; if the metric is reported per `condition` label value, confirm latest() reads the intended series
+nrql:
+  query: "from Metric select latest(kube_pod_status_ready) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') facet k8s.pod.name, k8s.namespace.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out for this condition
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# Aggregation applied to the NRQL query value(s) before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison made between the signal and the threshold
+    operator: BELOW
+    # Value at which a violation is triggered
+    threshold: 1
+    # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Number of data points that must violate during the duration
+    thresholdOccurrences: ALL
+
+  # Optional Warning threshold; uncomment to enable
+  # - priority: WARNING
+  #   # Comparison made between the signal and the threshold
+  #   operator: ABOVE
+  #   # Value at which a violation is triggered
+  #   threshold: 0
+  #   # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+  #   thresholdDuration: 60
+  #   # Number of data points that must violate during the duration
+  #   thresholdOccurrences: AT_LEAST_ONCE
+
+# Loss of signal settings
+expiration:
+  # Whether open violations are closed when the signal is lost (Default: false)
+  closeViolationsOnExpiration: true
+  # Whether a "Loss of Signal" violation is opened when the signal is lost (Default: false)
+  openViolationOnExpiration: false
+  # Seconds; Max value: 172800 (48hrs); null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced signal settings
+# These control how data is windowed when the NRQL condition is evaluated
+signal:
+  # Seconds to wait for data that belongs in each aggregation window
+  aggregationDelay: 60
+  # Method that decides when an aggregation window is complete and can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Seconds to wait after each data point arrives so the whole batch is processed
+  aggregationTimer: null
+  # Length in seconds of the time window used to evaluate the NRQL query; 30 seconds <= x < 15 minutes
+  aggregationWindow: 60
+  # Type of value used to fill gaps (empty windows); defaults to STATIC
+  fillOption: NONE
+  # Fill value, used only with the static fill option; null is the default
+  fillValue: null
+  # Seconds; gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: null
+  # How long to wait before a signal starts being evaluated against this condition's thresholds
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/PodNotScheduled.yaml b/alert-policies/kubernetes-opentelemetry/PodNotScheduled.yaml
new file mode 100644
index 0000000000..38aea1d89d
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/PodNotScheduled.yaml
@@ -0,0 +1,76 @@
+name: Pod cannot be scheduled
+
+# Summary text describing what the condition detects
+description: |
+  Alert when a Pod cannot be scheduled for more than 5 minutes
+# Condition type, one of: BASELINE | STATIC
+type: STATIC
+
+# NRQL signal per pod. NOTE(review): presumably 1 means scheduled; if the metric is reported per `condition` label value, confirm latest() reads the intended series
+nrql:
+  query: "from Metric select latest(kube_pod_status_scheduled) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') and metricName = 'kube_pod_status_scheduled' facet k8s.pod.name, k8s.namespace.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out for this condition
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# Aggregation applied to the NRQL query value(s) before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison made between the signal and the threshold
+    operator: BELOW
+    # Value at which a violation is triggered
+    threshold: 1
+    # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Number of data points that must violate during the duration
+    thresholdOccurrences: ALL
+
+  # Optional Warning threshold; uncomment to enable
+  # - priority: WARNING
+  #   # Comparison made between the signal and the threshold
+  #   operator: ABOVE
+  #   # Value at which a violation is triggered
+  #   threshold: 0
+  #   # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+  #   thresholdDuration: 60
+  #   # Number of data points that must violate during the duration
+  #   thresholdOccurrences: AT_LEAST_ONCE
+
+# Loss of signal settings
+expiration:
+  # Whether open violations are closed when the signal is lost (Default: false)
+  closeViolationsOnExpiration: true
+  # Whether a "Loss of Signal" violation is opened when the signal is lost (Default: false)
+  openViolationOnExpiration: false
+  # Seconds; Max value: 172800 (48hrs); null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced signal settings
+# These control how data is windowed when the NRQL condition is evaluated
+signal:
+  # Seconds to wait for data that belongs in each aggregation window
+  aggregationDelay: 60
+  # Method that decides when an aggregation window is complete and can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Seconds to wait after each data point arrives so the whole batch is processed
+  aggregationTimer: null
+  # Length in seconds of the time window used to evaluate the NRQL query; 30 seconds <= x < 15 minutes
+  aggregationWindow: 60
+  # Type of value used to fill gaps (empty windows); defaults to STATIC
+  fillOption: NONE
+  # Fill value, used only with the static fill option; null is the default
+  fillValue: null
+  # Seconds; gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: null
+  # How long to wait before a signal starts being evaluated against this condition's thresholds
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/PodsFailingNamespace.yaml b/alert-policies/kubernetes-opentelemetry/PodsFailingNamespace.yaml
new file mode 100644
index 0000000000..e8926f955c
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/PodsFailingNamespace.yaml
@@ -0,0 +1,73 @@
+name: More than 5 pods failing in namespace
+
+# Summary text describing what the condition detects
+description: |
+  Alert when more than 5 pods are failing in a namespace for more than 5 minutes
+
+# Condition type, one of: BASELINE | STATIC
+type: STATIC
+
+# NRQL signal: pods per namespace whose 'Failed' phase series is 1. NOTE(review): assumes the phase metric reports 0/1 per phase - confirm
+nrql:
+  query: "from Metric select uniqueCount(k8s.pod.name) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') and metricName = 'kube_pod_status_phase' and kube_pod_status_phase ['latest'] = 1 and phase = 'Failed' facet k8s.namespace.name, k8s.cluster.name"
+
+# Baseline direction (Default: LOWER_ONLY); left commented out for this condition
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# Aggregation applied to the NRQL query value(s) before comparison with terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Comparison made between the signal and the threshold
+    operator: ABOVE
+    # Value at which a violation is triggered; 5 matches the "more than 5 pods" name and description
+    threshold: 5
+    # Duration in seconds; 120 - 3600, a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # Number of data points that must violate during the duration
+    thresholdOccurrences: ALL
+
+  # Optional Warning threshold; uncomment to enable
+  # - priority: WARNING
+  #   operator: ABOVE
+  #   threshold: 1
+  #   thresholdDuration: 300
+  #   thresholdOccurrences: ALL | AT_LEAST_ONCE
+
+# Loss of signal settings
+expiration:
+  # Whether open violations are closed when the signal is lost (Default: false)
+  closeViolationsOnExpiration: true
+  # Whether a "Loss of Signal" violation is opened when the signal is lost (Default: false)
+  openViolationOnExpiration: false
+  # Seconds; Max value: 172800 (48hrs); null when closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced signal settings
+# These control how data is windowed when the NRQL condition is evaluated
+signal:
+  # Seconds to wait for data that belongs in each aggregation window
+  aggregationDelay: 60
+  # Method that decides when an aggregation window is complete and can be evaluated for violations
+  aggregationMethod: EVENT_FLOW
+  # Seconds to wait after each data point arrives so the whole batch is processed
+  aggregationTimer: null
+  # Length in seconds of the time window used to evaluate the NRQL query; 30 seconds <= x < 15 minutes
+  aggregationWindow: 60
+  # Type of value used to fill gaps (empty windows); defaults to STATIC
+  fillOption: NONE
+  # Fill value, used only with the static fill option; null is the default
+  fillValue: null
+  # Seconds; gathers data in overlapping time windows to smooth the chart line and make trends easier to spot
+  slideBy: null
+  # How long to wait before a signal starts being evaluated against this condition's thresholds
+  evaluationDelay: 60
+
+# OPTIONAL: runbook URL sent with the notification
+runbookUrl: null
+
+# Time after which a violation closes automatically
+# Seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/alert-policies/kubernetes-opentelemetry/StatefulsetPodsMissing.yaml b/alert-policies/kubernetes-opentelemetry/StatefulsetPodsMissing.yaml
new file mode 100644
index 0000000000..7452575bb6
--- /dev/null
+++ b/alert-policies/kubernetes-opentelemetry/StatefulsetPodsMissing.yaml
@@ -0,0 +1,73 @@
+name: Statefulset is missing Pods
+
+# Description and details
+description: |
+  Alert when Statefulset is missing Pods for > 5 minutes
+
+# Type of alert: BASELINE | STATIC
+type: STATIC
+
+# NRQL query
+nrql:
+  query: "from Metric latest(kube_statefulset_replicas) - latest(kube_statefulset_status_replicas_ready) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') facet k8s.statefulset.name, k8s.namespace.name, k8s.cluster.name"
+
+# Direction in which baseline is set (Default: LOWER_ONLY)
+# baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
+
+# Function used to aggregate the NRQL query value(s) for comparison to the terms.threshold (Default: SINGLE_VALUE)
+valueFunction: SINGLE_VALUE
+
+# List of Critical and Warning thresholds for the condition
+terms:
+  - priority: CRITICAL
+    # Operator used to compare against the threshold.
+    operator: ABOVE
+    # Value that triggers a violation
+    threshold: 0
+    # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
+    thresholdDuration: 300
+    # How many data points must be in violation for the duration
+    thresholdOccurrences: ALL
+
+  # Adding a Warning threshold is optional
+  # - priority: WARNING
+  #   operator: ABOVE
+  #   threshold: 1
+  #   thresholdDuration: 300
+  #   thresholdOccurrences: ALL | AT_LEAST_ONCE
+
+# Loss of Signal Settings
+expiration:
+  # Close open violations if signal is lost (Default: false)
+  closeViolationsOnExpiration: true
+  # Open "Loss of Signal" violation if signal is lost (Default: false)
+  openViolationOnExpiration: false
+  # Time in seconds; Max value: 172800 (48hrs), null if closeViolationsOnExpiration and openViolationOnExpiration are both 'false'
+  expirationDuration: 300
+
+# Advanced Signal Settings
+# Controls how incoming data is aggregated, gap-filled, and delayed before the NRQL condition is evaluated
+signal:
+  # How long we wait for data that belongs in each aggregation window
+  aggregationDelay: 60 # seconds
+  # The method that determines when we consider an aggregation window to complete so that we can evaluate the signals for violations.
+  aggregationMethod: EVENT_FLOW
+  # How long we wait after each data point arrives to make sure we've processed the whole batch.
+  aggregationTimer: null # seconds
+  # Controls the duration of the time window used to evaluate the NRQL query
+  aggregationWindow: 60 # seconds; 30 seconds <= x < 15 minutes
+  # Option that determines the type of value that should be used to fill gaps (empty windows).
+  fillOption: NONE # defaults to STATIC
+  # If using the static fill option, this value is used for filling.
+  fillValue: null # default
+  # This setting gathers data in overlapping time windows to smooth the chart line, making it easier to spot trends.
+  slideBy: null # seconds
+  # Evaluation delay is how long we wait before we start evaluating a signal against the thresholds in this condition.
+  evaluationDelay: 60
+
+# OPTIONAL: URL of runbook to be sent with notification
+runbookUrl:
+
+# Duration after which a violation automatically closes
+# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
+violationTimeLimitSeconds: 21600
diff --git a/quickstarts/kubernetes-opentelemetry/config.yml b/quickstarts/kubernetes-opentelemetry/config.yml
new file mode 100644
index 0000000000..0a2b17214f
--- /dev/null
+++ b/quickstarts/kubernetes-opentelemetry/config.yml
@@ -0,0 +1,54 @@
+slug: kubernetes-opentelemetry
+title: Kubernetes (OpenTelemetry)
+description: |
+  ## Why monitor Kubernetes?
+
+  Kubernetes is an open-source system for automating deployment, scaling, and, management of containerized applications. The New Relic Kubernetes monitoring quickstart gives you visibility into your Kubernetes clusters and workloads in minutes, whether your clusters are hosted on-premises or in the cloud.
+
+  ### Kubernetes quickstart highlights
+
+  The New Relic Kubernetes quickstart uses dashboards to proactively monitor your metrics, like:
+
+  - resources used
+  - number of K8s objects
+  - namespaces per cluster
+  - pods by namespace
+  - container cpu usage
+  - container restarts
+  - missing pods by deployment
+  - node resource consumption, and more.
+
+  This quickstart is also compatible with on-host integrations like:
+
+  - Cassandra
+  - MySQL
+  - Apache, and more.
+
+  ### New Relic + Kubernetes = Optimum performance monitoring
+
+  The [New Relic Kubernetes](https://docs.newrelic.com/docs/integrations/kubernetes-integration/installation/kubernetes-integration-install-configure/) quickstart has multiple components that work together to give you end-to-end observability across your clusters. While you have the flexibility to deploy the components that you prefer, to achieve full observability, you need to install the complete package to monitor all metrics. Use our quickstart to generate a Kubernetes manifest and add Pixie for more fine-grained telemetry data. You can also do the installation with Pixie for fine-grained telemetry data.
+  Our quickstart monitors the aggregated core and memory usage across all nodes in your cluster. This allows you to meet resource requirements for optimal application performance. It also empowers you to track resource consumption, find pods that aren't running, monitor disk usage, and troubleshoot container restarts. The New Relic Kubernetes integration has dashboards and a cluster explorer that provide a multi-dimensional representation of a Kubernetes cluster from which you can explore your namespaces, deployments, nodes, pods, containers, and applications. Download the New Relic Kubernetes quickstart today to gain instant visibility into your Kubernetes services, clusters and workloads in minutes.
+summary: |
+  Monitoring Kubernetes is crucial to gain instant visibility into Kubernetes clusters and workloads. Download New Relic Kubernetes quickstart to proactively monitor Kubernetes cluster health and capacity.
+level: New Relic
+authors:
+  - New Relic
+documentation:
+  - name: Kubernetes installation docs
+    description: |
+      Kubernetes is an open-source container-orchestration system for automating
+      computer application deployment, scaling, and management.
+    url: >-
+      https://docs.newrelic.com/docs/integrations/host-integrations/host-integrations-list/kubernetes-monitoring-integration
+dataSourceIds:
+  - kubernetes
+keywords:
+  - kubernetes
+  - containers
+  - pixie
+  - k8s
+  - opentelemetry
+dashboards:
+  - kubernetes
+alertPolicies:
+  - kubernetes-opentelemetry
diff --git a/quickstarts/kubernetes-opentelemetry/logo.svg b/quickstarts/kubernetes-opentelemetry/logo.svg
new file mode 100644
index 0000000000..1efad8e7a6
--- /dev/null
+++ b/quickstarts/kubernetes-opentelemetry/logo.svg
@@ -0,0 +1 @@
+<svg height="198" viewBox="0 0 200 198" width="200" xmlns="http://www.w3.org/2000/svg"><path d="m98.265625 1.441406c-54.269531 0-98.265625 43.933594-98.265625 98.132813 0 54.199221 43.996094 98.136721 98.265625 98.136721 54.269535 0 98.265625-43.9375 98.265625-98.136721 0-54.199219-43.99609-98.132813-98.265625-98.132813zm0 183.667964c-15.4375 0-27.957031-10.30078-27.957031-23.0039h55.917966c0 12.70312-12.51953 23.0039-27.960935 23.0039zm46.179685-30.62109h-92.363279v-16.72656h92.367189v16.72656zm-.33203-25.33594h-91.765624c-.308594-.35156-.621094-.69922-.914062-1.05468-9.453125-11.46485-11.679688-17.44922-13.84375-23.55078-.03516-.19922 11.464844 2.34765 19.621094 4.17968 0 0 4.195312.97266 10.332031 2.08985-5.890625-6.89844-9.390625-15.664066-9.390625-24.625004 0-19.671875 15.109375-36.863281 9.660156-50.757812 5.304688.433594 10.976562 11.183594 11.359375 27.988281 5.640625-7.78125 8-21.996094 8-30.710937 0-9.019532 5.953125-19.503907 11.90625-19.859376-5.304687 8.734376 1.378905 16.226563 7.316405 34.808594 2.23047 6.976563 1.94531 18.722656 3.66406 26.171875.57422-15.472656 3.23438-38.042969 13.0625-45.835937-4.33593 9.8125.64063 22.09375 4.04688 27.996094 5.49219 9.527343 8.82031 16.742187 8.82031 30.390624 0 9.152344-3.38281 17.769528-9.08984 24.503908 6.48828-1.21875 10.96875-2.3125 10.96875-2.3125l21.07422-4.10547c0-.004-3.0625 12.57422-14.82813 24.68359zm0 0" fill="#e6512b" transform="matrix(.92315881 0 0 .92315881 7.550848 7.651551)"/></svg>
\ No newline at end of file

From da8ce23e60212f847135836220bb908cb7197ca8 Mon Sep 17 00:00:00 2001
From: Doua Vue <dvue@newrelic.com>
Date: Mon, 7 Oct 2024 14:42:47 -0500
Subject: [PATCH 02/10] feat: Add datasource for k8s otel

---
 data-sources/kubernetes-opentelemetry/config.yml |  9 +++++++++
 data-sources/kubernetes-opentelemetry/logo.svg   |  1 +
 quickstarts/kubernetes-opentelemetry/config.yml  | 12 +++++-------
 3 files changed, 15 insertions(+), 7 deletions(-)
 create mode 100644 data-sources/kubernetes-opentelemetry/config.yml
 create mode 100644 data-sources/kubernetes-opentelemetry/logo.svg

diff --git a/data-sources/kubernetes-opentelemetry/config.yml b/data-sources/kubernetes-opentelemetry/config.yml
new file mode 100644
index 0000000000..2cf845d05d
--- /dev/null
+++ b/data-sources/kubernetes-opentelemetry/config.yml
@@ -0,0 +1,9 @@
+id: kubernetes-opentelemetry
+displayName: Kubernetes (OpenTelemetry)
+description: |
+  Manage telemetry data coming into New Relic.
+install:
+  primary:
+    link:
+      url: https://docs.newrelic.com/docs/kubernetes-pixie/kubernetes-integration/installation/k8s-otel/#install
+icon: logo.png
diff --git a/data-sources/kubernetes-opentelemetry/logo.svg b/data-sources/kubernetes-opentelemetry/logo.svg
new file mode 100644
index 0000000000..e33c0ab527
--- /dev/null
+++ b/data-sources/kubernetes-opentelemetry/logo.svg
@@ -0,0 +1 @@
+<svg height="200" viewBox="0 0 200 200" width="200" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><filter id="a" height="100%" width="100%" x="0%" y="0%"><feColorMatrix in="SourceGraphic" type="matrix" values="0 0 0 0 1 0 0 0 0 1 0 0 0 0 1 0 0 0 1 0"/></filter><mask id="b"><g filter="url(#a)"><image height="200" width="200" xlink:href="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAMgAAADICAIAAAAiOjnJAAAABmJLR0QA/wD/AP+gvaeTAAAAiklEQVR4nO3BAQEAAACCIP+vbkhAAQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADwYNWXAAG9rB+hAAAAAElFTkSuQmCC"/></g></mask><clipPath id="c"><path d="m0 0h200v200h-200z"/></clipPath><g clip-path="url(#c)" mask="url(#b)"><path d="m168.753906 54.582031c-.953125-3.050781-3.242187-5.527343-6.101562-7.054687l-58.128906-27.824219c-1.523438-.761719-3.238282-.953125-4.765626-.953125-1.523437 0-3.238281 0-4.761718.382812l-58.132813 28.015626c-2.859375 1.332031-4.953125 3.8125-5.714843 7.050781l-14.296876 62.703125c-.570312 3.242187.191407 6.480468 2.097657 9.148437l40.214843 49.746094c2.285157 2.285156 5.527344 3.8125 8.765626 4.003906h64.039062c3.429688.378907 6.671875-1.144531 8.765625-4.003906l40.214844-49.746094c1.90625-2.667969 2.671875-5.90625 2.289062-9.148437zm0 0" fill="#326de6"/><path d="m159.796875 114.425781c-.191406 0-.382813 0-.382813-.191406 0-.1875-.382812-.1875-.761718-.1875-.761719-.191406-1.523438-.191406-2.289063-.191406-.378906 0-.761719 0-1.140625-.191407h-.191406c-2.097656-.191406-4.382812-.570312-6.480469-1.144531-.570312-.191406-1.144531-.761719-1.335937-1.332031l-1.523438-.382812c.761719-5.527344.382813-11.246094-.761718-16.769532-1.335938-5.527344-3.621094-10.867187-6.671876-15.628906l1.144532-1.144531v-.191407c0-.570312.191406-1.332031.570312-1.714843 1.714844-1.523438 3.433594-2.667969 5.339844-3.8125.378906-.191407.761719-.378907 1.140625-.570313.761719-.382812 1.335937-.761718 
2.097656-1.144531.191407-.191406.382813-.191406.570313-.382813.191406-.1875 0-.1875 0-.378906 1.714844-1.335937 2.097656-3.621094.765625-5.335937-.574219-.761719-1.71875-1.335938-2.671875-1.335938s-1.902344.382813-2.667969.953125l-.1875.191406c-.191406.191407-.382813.382813-.574219.382813-.570312.570313-1.144531 1.140625-1.523437 1.714844-.191407.378906-.574219.570312-.761719.761719-1.335938 1.523437-3.050781 3.046874-4.765625 4.191406-.382813.191406-.761719.382812-1.144531.382812-.191406 0-.570313 0-.761719-.191406h-.191406l-1.523438.953125c-1.523437-1.523437-3.242187-3.050781-4.765625-4.574219-7.050781-5.527344-15.820312-8.957031-24.777344-9.910156l-.191406-1.527344v.191406c-.570312-.378906-.761718-.953124-.953125-1.523437 0-2.097656 0-4.191406.382813-6.480469v-.191406c0-.378906.191406-.761719.191406-1.140625.191406-.765625.191406-1.527344.378906-2.289063v-1.144531c.191406-1.90625-1.332031-3.8125-3.238281-4-1.144531-.191406-2.285156.378907-3.238281 1.332031-.765625.761719-1.144532 1.714844-1.144532 2.667969v.953125c0 .761719.191407 1.527344.378907 2.289063.191406.378906.191406.761719.191406 1.140625v.191406c.382813 2.097656.382813 4.195312.382813 6.480469-.191407.574219-.382813 1.144531-.953126 1.523437v.382813l-.191406 1.523437c-2.097656.191406-4.191406.574219-6.480468.953125-8.957032 1.90625-17.152344 6.671875-23.441407 13.34375l-1.144531-.761719h-.191406c-.191406 0-.378906.1875-.761719.1875-.378906 0-.761719-.1875-1.144531-.378906-1.714844-1.335937-3.429688-2.859375-4.761719-4.382812-.191406-.382813-.574219-.574219-.765625-.765625-.570312-.570313-.953125-1.140625-1.523438-1.714844-.191406-.1875-.382812-.1875-.570312-.378906-.191406-.191407-.191406-.191407-.191406-.191407-.761719-.570312-1.714844-.953124-2.667969-.953124-1.144531 0-2.097656.382812-2.667969 1.335937-1.144531 1.714844-.761718 4 .761719 5.335937.191406 0 .191406.1875.191406.1875s.378907.382813.570313.382813c.570312.382813 1.335937.761719 2.097656 1.144531.378906.191406.761719.378906 
1.144531.570313 1.902344 1.144531 3.808594 2.289062 5.335938 3.8125.378906.382812.761719 1.144531.570312 1.714843v-.191406l1.144531 1.144532c-.191406.382812-.382812.570312-.574218.953124-5.90625 9.339844-8.382813 20.394532-6.667969 31.257813l-1.527344.378906c0 .191407-.1875.191407-.1875.191407-.191406.574218-.765625.953124-1.335937 1.335937-2.097656.570313-4.191406.953125-6.480469 1.140625-.378906 0-.761719 0-1.144531.191406-.761719 0-1.523438.191406-2.285156.191406-.191407 0-.382813.191407-.761719.191407-.191407 0-.191407 0-.382813.191406-2.097656.378906-3.429687 2.285156-3.050781 4.382813.382813 1.714843 2.097656 2.859374 3.8125 2.667968.382813 0 .574219 0 .953125-.191406.191406 0 .191406 0 .191406-.191406 0-.1875.570313 0 .761719 0 .761719-.1875 1.527344-.570313 2.097656-.761719.382813-.191406.761719-.378906 1.144531-.378906h.191407c2.09375-.765625 4-1.335938 6.289062-1.71875h.1875c.574219 0 1.144531.191406 1.527344.574219.191406 0 .191406.191406.191406.191406l1.714844-.191406c2.859375 8.765624 8.195313 16.582031 15.628906 22.296874 1.714844 1.335938 3.238281 2.480469 5.144531 3.433594l-.953124 1.332032c0 .191406.191406.191406.191406.191406.378906.570312.378906 1.332031.191406 1.90625-.765625 1.90625-1.90625 3.8125-3.050781 5.527344v.191406c-.191407.378906-.382813.570312-.761719.953125-.382812.378906-.761719 1.140625-1.335938 1.902343-.191406.191407-.191406.382813-.378906.574219 0 0 0 .191407-.191406.191407-.953125 1.90625-.191406 4.191406 1.523438 5.144531.382812.191406.953124.382812 1.335937.382812 1.523437 0 2.859375-.953125 3.621094-2.289062 0 0 0-.191407.1875-.191407 0-.191406.191406-.378906.382812-.570312.191407-.761719.570313-1.335938.761719-2.097656l.382812-1.144532c.570313-2.09375 1.523438-4 2.476563-5.90625.382813-.570312.953125-.953124 1.523437-1.144531.191407 0 .191407 0 .191407-.191406l.761719-1.523437c5.339843 2.097656 10.863281 3.050781 16.582031 3.050781 3.429687 0 6.863281-.382813 10.292969-1.335938 2.097656-.378906 4.191406-1.144531 
6.097656-1.714843l.761718 1.335937c.191407 0 .191407 0 .191407.1875.574219.191406 1.144531.574219 1.523437 1.144531.953125 1.90625 1.90625 3.8125 2.480469 5.910156v.1875l.378906 1.144532c.191407.761718.382813 1.527344.765625 2.097656.1875.191406.1875.378906.378906.570312 0 0 0 .191407.191407.191407.761719 1.335937 2.097656 2.289062 3.621093 2.289062.570313 0 .953126-.191406 1.523438-.382812.761719-.382813 1.527344-1.144531 1.714844-2.097657.191406-.953124.191406-1.90625-.1875-2.859374 0-.1875-.191406-.1875-.191406-.1875 0-.191407-.191407-.382813-.382813-.574219-.378906-.761719-.761719-1.332031-1.332031-1.90625-.191406-.378907-.382813-.570313-.761719-.953125v-.378906c-1.335937-1.714844-2.289063-3.621094-3.050781-5.527344-.191406-.574219-.191406-1.335938.191406-1.90625 0-.191406.1875-.191406.1875-.191406l-.570312-1.523438c9.71875-5.910156 17.152343-15.058594 20.585937-25.921875l1.523437.191406c.191407 0 .191407-.191406.191407-.191406.378906-.378906.953125-.570313 1.523437-.570313h.191406c2.097657.378907 4.191407.953126 6.097657 1.714844h.191406c.378906.191406.761719.382813 1.144531.382813.761719.378906 1.332032.761719 2.09375.953125.191406 0 .382813.1875.765625.1875.1875 0 .1875 0 .378907.191406.382812.191406.570312.191406.953124.191406 1.714844 0 3.242188-1.144531 3.8125-2.667968-.191406-2.097657-1.714843-3.621094-3.429687-4.003907zm-55.082031-5.90625-5.144532 2.476563-5.148437-2.476563-1.332031-5.527343 3.621094-4.574219h5.714843l3.625 4.574219zm31.066406-12.390625c.953125 4.003906 1.144531 8.003906.761719 12.007813l-18.105469-5.144531c-1.714844-.382813-2.667969-2.097657-2.289062-3.8125.191406-.570313.382812-.953126.765624-1.335938l14.292969-12.957031c2.097657 3.429687 3.621094 7.242187 4.574219 11.242187zm-10.292969-18.296875-15.628906 11.054688c-1.332031.761719-3.238281.574219-4.191406-.761719-.382813-.382812-.570313-.761719-.570313-1.335938l-1.144531-19.246093c8.386719.953125 15.816406 4.574219 21.535156 10.289062zm-34.496093-9.71875 3.8125-.761719-.953126 
19.058594c0 1.714844-1.523437 3.050782-3.242187 3.050782-.570313 0-.953125-.191407-1.523437-.382813l-15.820313-11.246094c4.957031-4.765625 11.054687-8.195312 17.726563-9.71875zm-23.253907 16.773438 14.105469 12.578125c1.335938 1.144531 1.523438 3.046875.382812 4.382812-.382812.570313-.765624.761719-1.527343.953125l-18.484375 5.335938c-.574219-8.003907 1.332031-16.199219 5.523437-23.25zm-3.238281 32.207031 18.867188-3.238281c1.527343 0 3.050781.953125 3.242187 2.476562.191406.570313.191406 1.335938-.191406 1.90625l-7.242188 17.535157c-6.671875-4.382813-12.007812-11.054688-14.675781-18.679688zm43.265625 23.632812c-2.667969.574219-5.339844.953126-8.195313.953126-4.003906 0-8.195312-.761719-12.007812-1.90625l9.339844-16.960938c.953125-1.144531 2.476562-1.523438 3.808594-.761719.574218.378907.953124.761719 1.527343 1.332031l9.148438 16.582032c-1.144531.191406-2.289063.382812-3.621094.761718zm23.25-16.578124c-2.859375 4.574218-6.859375 8.574218-11.433594 11.433593l-7.433593-17.914062c-.382813-1.527344.378906-3.050781 1.714843-3.621094.570313-.191406 1.144531-.382813 1.714844-.382813l19.058594 3.238282c-.953125 2.671875-2.09375 5.148437-3.621094 7.246094zm0 0" fill="#fff"/></g></svg>
\ No newline at end of file
diff --git a/quickstarts/kubernetes-opentelemetry/config.yml b/quickstarts/kubernetes-opentelemetry/config.yml
index 0a2b17214f..2900593745 100644
--- a/quickstarts/kubernetes-opentelemetry/config.yml
+++ b/quickstarts/kubernetes-opentelemetry/config.yml
@@ -5,7 +5,7 @@ description: |
 
   Kubernetes is an open-source system for automating deployment, scaling, and, management of containerized applications. The New Relic Kubernetes monitoring quickstart gives you visibility into your Kubernetes clusters and workloads in minutes, whether your clusters are hosted on-premises or in the cloud.
 
-  ### Kubernetes quickstart highlights
+  ### Kubernetes (OpenTelemetry) quickstart highlights
 
   The New Relic Kubernetes quickstart uses dashboards to proactively monitor your metrics, like:
 
@@ -26,7 +26,7 @@ description: |
 
   ### New Relic + Kubernetes = Optimum performance monitoring
 
-  The [New Relic Kubernetes](https://docs.newrelic.com/docs/integrations/kubernetes-integration/installation/kubernetes-integration-install-configure/) quickstart has multiple components that work together to give you end-to-end observability across your clusters. While you have the flexibility to deploy the components that you prefer, to achieve full observability, you need to install the complete package to monitor all metrics. Use our quickstart to generate a Kubernetes manifest and add Pixie for more fine-grained telemetry data. You can also do the installation with Pixie for fine-grained telemetry data.
+  The [New Relic Kubernetes (OpenTelemetry)](https://docs.newrelic.com/docs/integrations/kubernetes-integration/installation/kubernetes-integration-install-configure/) quickstart has multiple components that work together to give you end-to-end observability across your clusters. While you have the flexibility to deploy the components that you prefer, to achieve full observability, you need to install the complete package to monitor all metrics. Use our quickstart to generate a Kubernetes manifest and add Pixie for more fine-grained telemetry data. You can also do the installation with Pixie for fine-grained telemetry data.
   Our quickstart monitors the aggregated core and memory usage across all nodes in your cluster. This allows you to meet resource requirements for optimal application performance. It also empowers you to track resource consumption, find pods that aren't running, monitor disk usage, and troubleshoot container restarts. The New Relic Kubernetes integration has dashboards and a cluster explorer that provide a multi-dimensional representation of a Kubernetes cluster from which you can explore your namespaces, deployments, nodes, pods, containers, and applications. Download the New Relic Kubernetes quickstart today to gain instant visibility into your Kubernetes services, clusters and workloads in minutes.
 summary: |
   Monitoring Kubernetes is crucial to gain instant visibility into Kubernetes clusters and workloads. Download New Relic Kubernetes quickstart to proactively monitor Kubernetes cluster health and capacity.
@@ -34,21 +34,19 @@ level: New Relic
 authors:
   - New Relic
 documentation:
-  - name: Kubernetes installation docs
+  - name: Kubernetes (OpenTelemetry) installation docs
     description: |
       Kubernetes is an open-source container-orchestration system for automating
       computer application deployment, scaling, and management.
     url: >-
-      https://docs.newrelic.com/docs/integrations/host-integrations/host-integrations-list/kubernetes-monitoring-integration
+      https://docs.newrelic.com/docs/kubernetes-pixie/kubernetes-integration/installation/k8s-otel/#install
 dataSourceIds:
-  - kubernetes
+  - kubernetes-opentelemetry
 keywords:
   - kubernetes
   - containers
   - pixie
   - k8s
   - opentelemetry
-dashboards:
-  - kubernetes
 alertPolicies:
   - kubernetes-opentelemetry

From ef5d5bfe659194132e3a95888f157f0f0c638d27 Mon Sep 17 00:00:00 2001
From: Doua Vue <dvue@newrelic.com>
Date: Tue, 8 Oct 2024 08:43:15 -0500
Subject: [PATCH 03/10] fix: Update image extension

---
 data-sources/kubernetes-opentelemetry/config.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/data-sources/kubernetes-opentelemetry/config.yml b/data-sources/kubernetes-opentelemetry/config.yml
index 2cf845d05d..371748f75a 100644
--- a/data-sources/kubernetes-opentelemetry/config.yml
+++ b/data-sources/kubernetes-opentelemetry/config.yml
@@ -6,4 +6,4 @@ install:
   primary:
     link:
       url: https://docs.newrelic.com/docs/kubernetes-pixie/kubernetes-integration/installation/k8s-otel/#install
-icon: logo.png
+icon: logo.svg

From d0572acb07e1a4e6d31430b70077855d39c885a3 Mon Sep 17 00:00:00 2001
From: Doua Vue <dvue@newrelic.com>
Date: Tue, 8 Oct 2024 08:47:06 -0500
Subject: [PATCH 04/10] fix: Update image for k8s-otel quickstart

---
 quickstarts/kubernetes-opentelemetry/logo.svg | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/quickstarts/kubernetes-opentelemetry/logo.svg b/quickstarts/kubernetes-opentelemetry/logo.svg
index 1efad8e7a6..e33c0ab527 100644
--- a/quickstarts/kubernetes-opentelemetry/logo.svg
+++ b/quickstarts/kubernetes-opentelemetry/logo.svg
@@ -1 +1 @@
-<svg height="198" viewBox="0 0 200 198" width="200" xmlns="http://www.w3.org/2000/svg"><path d="m98.265625 1.441406c-54.269531 0-98.265625 43.933594-98.265625 98.132813 0 54.199221 43.996094 98.136721 98.265625 98.136721 54.269535 0 98.265625-43.9375 98.265625-98.136721 0-54.199219-43.99609-98.132813-98.265625-98.132813zm0 183.667964c-15.4375 0-27.957031-10.30078-27.957031-23.0039h55.917966c0 12.70312-12.51953 23.0039-27.960935 23.0039zm46.179685-30.62109h-92.363279v-16.72656h92.367189v16.72656zm-.33203-25.33594h-91.765624c-.308594-.35156-.621094-.69922-.914062-1.05468-9.453125-11.46485-11.679688-17.44922-13.84375-23.55078-.03516-.19922 11.464844 2.34765 19.621094 4.17968 0 0 4.195312.97266 10.332031 2.08985-5.890625-6.89844-9.390625-15.664066-9.390625-24.625004 0-19.671875 15.109375-36.863281 9.660156-50.757812 5.304688.433594 10.976562 11.183594 11.359375 27.988281 5.640625-7.78125 8-21.996094 8-30.710937 0-9.019532 5.953125-19.503907 11.90625-19.859376-5.304687 8.734376 1.378905 16.226563 7.316405 34.808594 2.23047 6.976563 1.94531 18.722656 3.66406 26.171875.57422-15.472656 3.23438-38.042969 13.0625-45.835937-4.33593 9.8125.64063 22.09375 4.04688 27.996094 5.49219 9.527343 8.82031 16.742187 8.82031 30.390624 0 9.152344-3.38281 17.769528-9.08984 24.503908 6.48828-1.21875 10.96875-2.3125 10.96875-2.3125l21.07422-4.10547c0-.004-3.0625 12.57422-14.82813 24.68359zm0 0" fill="#e6512b" transform="matrix(.92315881 0 0 .92315881 7.550848 7.651551)"/></svg>
\ No newline at end of file
+<svg height="200" viewBox="0 0 200 200" width="200" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><filter id="a" height="100%" width="100%" x="0%" y="0%"><feColorMatrix in="SourceGraphic" type="matrix" values="0 0 0 0 1 0 0 0 0 1 0 0 0 0 1 0 0 0 1 0"/></filter><mask id="b"><g filter="url(#a)"><image height="200" width="200" xlink:href="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAMgAAADICAIAAAAiOjnJAAAABmJLR0QA/wD/AP+gvaeTAAAAiklEQVR4nO3BAQEAAACCIP+vbkhAAQAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAADwYNWXAAG9rB+hAAAAAElFTkSuQmCC"/></g></mask><clipPath id="c"><path d="m0 0h200v200h-200z"/></clipPath><g clip-path="url(#c)" mask="url(#b)"><path d="m168.753906 54.582031c-.953125-3.050781-3.242187-5.527343-6.101562-7.054687l-58.128906-27.824219c-1.523438-.761719-3.238282-.953125-4.765626-.953125-1.523437 0-3.238281 0-4.761718.382812l-58.132813 28.015626c-2.859375 1.332031-4.953125 3.8125-5.714843 7.050781l-14.296876 62.703125c-.570312 3.242187.191407 6.480468 2.097657 9.148437l40.214843 49.746094c2.285157 2.285156 5.527344 3.8125 8.765626 4.003906h64.039062c3.429688.378907 6.671875-1.144531 8.765625-4.003906l40.214844-49.746094c1.90625-2.667969 2.671875-5.90625 2.289062-9.148437zm0 0" fill="#326de6"/><path d="m159.796875 114.425781c-.191406 0-.382813 0-.382813-.191406 0-.1875-.382812-.1875-.761718-.1875-.761719-.191406-1.523438-.191406-2.289063-.191406-.378906 0-.761719 0-1.140625-.191407h-.191406c-2.097656-.191406-4.382812-.570312-6.480469-1.144531-.570312-.191406-1.144531-.761719-1.335937-1.332031l-1.523438-.382812c.761719-5.527344.382813-11.246094-.761718-16.769532-1.335938-5.527344-3.621094-10.867187-6.671876-15.628906l1.144532-1.144531v-.191407c0-.570312.191406-1.332031.570312-1.714843 1.714844-1.523438 3.433594-2.667969 5.339844-3.8125.378906-.191407.761719-.378907 1.140625-.570313.761719-.382812 1.335937-.761718 
2.097656-1.144531.191407-.191406.382813-.191406.570313-.382813.191406-.1875 0-.1875 0-.378906 1.714844-1.335937 2.097656-3.621094.765625-5.335937-.574219-.761719-1.71875-1.335938-2.671875-1.335938s-1.902344.382813-2.667969.953125l-.1875.191406c-.191406.191407-.382813.382813-.574219.382813-.570312.570313-1.144531 1.140625-1.523437 1.714844-.191407.378906-.574219.570312-.761719.761719-1.335938 1.523437-3.050781 3.046874-4.765625 4.191406-.382813.191406-.761719.382812-1.144531.382812-.191406 0-.570313 0-.761719-.191406h-.191406l-1.523438.953125c-1.523437-1.523437-3.242187-3.050781-4.765625-4.574219-7.050781-5.527344-15.820312-8.957031-24.777344-9.910156l-.191406-1.527344v.191406c-.570312-.378906-.761718-.953124-.953125-1.523437 0-2.097656 0-4.191406.382813-6.480469v-.191406c0-.378906.191406-.761719.191406-1.140625.191406-.765625.191406-1.527344.378906-2.289063v-1.144531c.191406-1.90625-1.332031-3.8125-3.238281-4-1.144531-.191406-2.285156.378907-3.238281 1.332031-.765625.761719-1.144532 1.714844-1.144532 2.667969v.953125c0 .761719.191407 1.527344.378907 2.289063.191406.378906.191406.761719.191406 1.140625v.191406c.382813 2.097656.382813 4.195312.382813 6.480469-.191407.574219-.382813 1.144531-.953126 1.523437v.382813l-.191406 1.523437c-2.097656.191406-4.191406.574219-6.480468.953125-8.957032 1.90625-17.152344 6.671875-23.441407 13.34375l-1.144531-.761719h-.191406c-.191406 0-.378906.1875-.761719.1875-.378906 0-.761719-.1875-1.144531-.378906-1.714844-1.335937-3.429688-2.859375-4.761719-4.382812-.191406-.382813-.574219-.574219-.765625-.765625-.570312-.570313-.953125-1.140625-1.523438-1.714844-.191406-.1875-.382812-.1875-.570312-.378906-.191406-.191407-.191406-.191407-.191406-.191407-.761719-.570312-1.714844-.953124-2.667969-.953124-1.144531 0-2.097656.382812-2.667969 1.335937-1.144531 1.714844-.761718 4 .761719 5.335937.191406 0 .191406.1875.191406.1875s.378907.382813.570313.382813c.570312.382813 1.335937.761719 2.097656 1.144531.378906.191406.761719.378906 
1.144531.570313 1.902344 1.144531 3.808594 2.289062 5.335938 3.8125.378906.382812.761719 1.144531.570312 1.714843v-.191406l1.144531 1.144532c-.191406.382812-.382812.570312-.574218.953124-5.90625 9.339844-8.382813 20.394532-6.667969 31.257813l-1.527344.378906c0 .191407-.1875.191407-.1875.191407-.191406.574218-.765625.953124-1.335937 1.335937-2.097656.570313-4.191406.953125-6.480469 1.140625-.378906 0-.761719 0-1.144531.191406-.761719 0-1.523438.191406-2.285156.191406-.191407 0-.382813.191407-.761719.191407-.191407 0-.191407 0-.382813.191406-2.097656.378906-3.429687 2.285156-3.050781 4.382813.382813 1.714843 2.097656 2.859374 3.8125 2.667968.382813 0 .574219 0 .953125-.191406.191406 0 .191406 0 .191406-.191406 0-.1875.570313 0 .761719 0 .761719-.1875 1.527344-.570313 2.097656-.761719.382813-.191406.761719-.378906 1.144531-.378906h.191407c2.09375-.765625 4-1.335938 6.289062-1.71875h.1875c.574219 0 1.144531.191406 1.527344.574219.191406 0 .191406.191406.191406.191406l1.714844-.191406c2.859375 8.765624 8.195313 16.582031 15.628906 22.296874 1.714844 1.335938 3.238281 2.480469 5.144531 3.433594l-.953124 1.332032c0 .191406.191406.191406.191406.191406.378906.570312.378906 1.332031.191406 1.90625-.765625 1.90625-1.90625 3.8125-3.050781 5.527344v.191406c-.191407.378906-.382813.570312-.761719.953125-.382812.378906-.761719 1.140625-1.335938 1.902343-.191406.191407-.191406.382813-.378906.574219 0 0 0 .191407-.191406.191407-.953125 1.90625-.191406 4.191406 1.523438 5.144531.382812.191406.953124.382812 1.335937.382812 1.523437 0 2.859375-.953125 3.621094-2.289062 0 0 0-.191407.1875-.191407 0-.191406.191406-.378906.382812-.570312.191407-.761719.570313-1.335938.761719-2.097656l.382812-1.144532c.570313-2.09375 1.523438-4 2.476563-5.90625.382813-.570312.953125-.953124 1.523437-1.144531.191407 0 .191407 0 .191407-.191406l.761719-1.523437c5.339843 2.097656 10.863281 3.050781 16.582031 3.050781 3.429687 0 6.863281-.382813 10.292969-1.335938 2.097656-.378906 4.191406-1.144531 
6.097656-1.714843l.761718 1.335937c.191407 0 .191407 0 .191407.1875.574219.191406 1.144531.574219 1.523437 1.144531.953125 1.90625 1.90625 3.8125 2.480469 5.910156v.1875l.378906 1.144532c.191407.761718.382813 1.527344.765625 2.097656.1875.191406.1875.378906.378906.570312 0 0 0 .191407.191407.191407.761719 1.335937 2.097656 2.289062 3.621093 2.289062.570313 0 .953126-.191406 1.523438-.382812.761719-.382813 1.527344-1.144531 1.714844-2.097657.191406-.953124.191406-1.90625-.1875-2.859374 0-.1875-.191406-.1875-.191406-.1875 0-.191407-.191407-.382813-.382813-.574219-.378906-.761719-.761719-1.332031-1.332031-1.90625-.191406-.378907-.382813-.570313-.761719-.953125v-.378906c-1.335937-1.714844-2.289063-3.621094-3.050781-5.527344-.191406-.574219-.191406-1.335938.191406-1.90625 0-.191406.1875-.191406.1875-.191406l-.570312-1.523438c9.71875-5.910156 17.152343-15.058594 20.585937-25.921875l1.523437.191406c.191407 0 .191407-.191406.191407-.191406.378906-.378906.953125-.570313 1.523437-.570313h.191406c2.097657.378907 4.191407.953126 6.097657 1.714844h.191406c.378906.191406.761719.382813 1.144531.382813.761719.378906 1.332032.761719 2.09375.953125.191406 0 .382813.1875.765625.1875.1875 0 .1875 0 .378907.191406.382812.191406.570312.191406.953124.191406 1.714844 0 3.242188-1.144531 3.8125-2.667968-.191406-2.097657-1.714843-3.621094-3.429687-4.003907zm-55.082031-5.90625-5.144532 2.476563-5.148437-2.476563-1.332031-5.527343 3.621094-4.574219h5.714843l3.625 4.574219zm31.066406-12.390625c.953125 4.003906 1.144531 8.003906.761719 12.007813l-18.105469-5.144531c-1.714844-.382813-2.667969-2.097657-2.289062-3.8125.191406-.570313.382812-.953126.765624-1.335938l14.292969-12.957031c2.097657 3.429687 3.621094 7.242187 4.574219 11.242187zm-10.292969-18.296875-15.628906 11.054688c-1.332031.761719-3.238281.574219-4.191406-.761719-.382813-.382812-.570313-.761719-.570313-1.335938l-1.144531-19.246093c8.386719.953125 15.816406 4.574219 21.535156 10.289062zm-34.496093-9.71875 3.8125-.761719-.953126 
19.058594c0 1.714844-1.523437 3.050782-3.242187 3.050782-.570313 0-.953125-.191407-1.523437-.382813l-15.820313-11.246094c4.957031-4.765625 11.054687-8.195312 17.726563-9.71875zm-23.253907 16.773438 14.105469 12.578125c1.335938 1.144531 1.523438 3.046875.382812 4.382812-.382812.570313-.765624.761719-1.527343.953125l-18.484375 5.335938c-.574219-8.003907 1.332031-16.199219 5.523437-23.25zm-3.238281 32.207031 18.867188-3.238281c1.527343 0 3.050781.953125 3.242187 2.476562.191406.570313.191406 1.335938-.191406 1.90625l-7.242188 17.535157c-6.671875-4.382813-12.007812-11.054688-14.675781-18.679688zm43.265625 23.632812c-2.667969.574219-5.339844.953126-8.195313.953126-4.003906 0-8.195312-.761719-12.007812-1.90625l9.339844-16.960938c.953125-1.144531 2.476562-1.523438 3.808594-.761719.574218.378907.953124.761719 1.527343 1.332031l9.148438 16.582032c-1.144531.191406-2.289063.382812-3.621094.761718zm23.25-16.578124c-2.859375 4.574218-6.859375 8.574218-11.433594 11.433593l-7.433593-17.914062c-.382813-1.527344.378906-3.050781 1.714843-3.621094.570313-.191406 1.144531-.382813 1.714844-.382813l19.058594 3.238282c-.953125 2.671875-2.09375 5.148437-3.621094 7.246094zm0 0" fill="#fff"/></g></svg>
\ No newline at end of file

From 08de38e8256afa986992cf7fa157582ac7937b1d Mon Sep 17 00:00:00 2001
From: Doua Vue <dvue@newrelic.com>
Date: Wed, 9 Oct 2024 09:50:24 -0500
Subject: [PATCH 05/10] fix: Address CR feedback re nrql and configs

---
 .../kubernetes-opentelemetry/ContainerCPUThrottling.yaml        | 2 +-
 .../kubernetes-opentelemetry/ContainerHighMemUtil.yaml          | 2 +-
 .../kubernetes-opentelemetry/NodeHighAllocatableCPUUtil.yaml    | 2 +-
 .../kubernetes-opentelemetry/NodeHighAllocatableMemUtil.yaml    | 2 +-
 .../kubernetes-opentelemetry/NodeHighFSCapacityUtil.yaml        | 2 +-
 alert-policies/kubernetes-opentelemetry/NodeIsNotReady.yaml     | 2 +-
 alert-policies/kubernetes-opentelemetry/NodePodCapacity.yaml    | 2 +-
 .../kubernetes-opentelemetry/PodsFailingNamespace.yaml          | 2 +-
 .../kubernetes-opentelemetry/StatefulsetPodsMissing.yaml        | 2 +-
 9 files changed, 9 insertions(+), 9 deletions(-)

diff --git a/alert-policies/kubernetes-opentelemetry/ContainerCPUThrottling.yaml b/alert-policies/kubernetes-opentelemetry/ContainerCPUThrottling.yaml
index 896c786d39..6ef77428b7 100644
--- a/alert-policies/kubernetes-opentelemetry/ContainerCPUThrottling.yaml
+++ b/alert-policies/kubernetes-opentelemetry/ContainerCPUThrottling.yaml
@@ -22,7 +22,7 @@ terms:
     # Operator used to compare against the threshold.
     operator: ABOVE
     # Value that triggers a violation
-    threshold: 90
+    threshold: 25
     # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
     thresholdDuration: 300
     # How many data points must be in violation for the duration
diff --git a/alert-policies/kubernetes-opentelemetry/ContainerHighMemUtil.yaml b/alert-policies/kubernetes-opentelemetry/ContainerHighMemUtil.yaml
index fe3db565c0..20f68e6954 100644
--- a/alert-policies/kubernetes-opentelemetry/ContainerHighMemUtil.yaml
+++ b/alert-policies/kubernetes-opentelemetry/ContainerHighMemUtil.yaml
@@ -8,7 +8,7 @@ type: STATIC
 
 # NRQL query
 nrql:
-  query: "from Metric max(container_memory_working_set_bytes) / filter(max(kube_pod_container_resource_limits), where resource = 'memory') where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') facet k8s.container.name, k8s.pod.name, k8s.namespace.name, k8s.cluster.name"
+  query: "from Metric select max(container_memory_working_set_bytes) / filter(max(kube_pod_container_resource_limits), where resource = 'memory') where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') facet pod, container, k8s.namespace.name, k8s.cluster.name"
 
 # Direction in which baseline is set (Default: LOWER_ONLY)
 # baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
diff --git a/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableCPUUtil.yaml b/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableCPUUtil.yaml
index ecf61d4fe2..400094e63f 100644
--- a/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableCPUUtil.yaml
+++ b/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableCPUUtil.yaml
@@ -8,7 +8,7 @@ type: STATIC
 
 # NRQL query
 nrql:
-  query: "from Metric select latest(k8s.node.cpu.utilization) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
+  query: "from Metric select average(k8s.node.cpu.utilization) * 100 where k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
 
 # Direction in which baseline is set (Default: LOWER_ONLY)
 # baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
diff --git a/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableMemUtil.yaml b/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableMemUtil.yaml
index da0e55aa99..c34b683fae 100644
--- a/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableMemUtil.yaml
+++ b/alert-policies/kubernetes-opentelemetry/NodeHighAllocatableMemUtil.yaml
@@ -8,7 +8,7 @@ type: STATIC
 
 # NRQL query
 nrql:
-  query: "from Metric select latest(k8s.node.memory.working_set) / filter(latest(kube_node_status_allocatable), WHERE resource = 'memory')  where k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
+  query: "from Metric select (average(k8s.node.memory.working_set) / filter(latest(kube_node_status_allocatable), WHERE resource = 'memory')) * 100 where k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
 
 # Direction in which baseline is set (Default: LOWER_ONLY)
 # baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
diff --git a/alert-policies/kubernetes-opentelemetry/NodeHighFSCapacityUtil.yaml b/alert-policies/kubernetes-opentelemetry/NodeHighFSCapacityUtil.yaml
index a09b71d454..4c57ae6d0b 100644
--- a/alert-policies/kubernetes-opentelemetry/NodeHighFSCapacityUtil.yaml
+++ b/alert-policies/kubernetes-opentelemetry/NodeHighFSCapacityUtil.yaml
@@ -8,7 +8,7 @@ type: STATIC
 
 # NRQL query
 nrql:
-  query: "from Metric select max(k8s.node.filesystem.usage) / max(k8s.node.filesystem.capacity) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
+  query: "from Metric select (average(k8s.node.filesystem.usage) / average(k8s.node.filesystem.capacity)) * 100 where k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
 
 # Direction in which baseline is set (Default: LOWER_ONLY)
 # baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
diff --git a/alert-policies/kubernetes-opentelemetry/NodeIsNotReady.yaml b/alert-policies/kubernetes-opentelemetry/NodeIsNotReady.yaml
index b46ee313d6..b64fd15328 100644
--- a/alert-policies/kubernetes-opentelemetry/NodeIsNotReady.yaml
+++ b/alert-policies/kubernetes-opentelemetry/NodeIsNotReady.yaml
@@ -9,7 +9,7 @@ type: STATIC
 
 # NRQL query
 nrql:
-  query: "from Metric if(latest(condition) = 'Ready', 0, 1) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
+  query: "from Metric select if(latest(condition) = 'Ready', 0, 1) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
 
 # Direction in which baseline is set (Default: LOWER_ONLY)
 # baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
diff --git a/alert-policies/kubernetes-opentelemetry/NodePodCapacity.yaml b/alert-policies/kubernetes-opentelemetry/NodePodCapacity.yaml
index 09c20296fd..41026339b3 100644
--- a/alert-policies/kubernetes-opentelemetry/NodePodCapacity.yaml
+++ b/alert-policies/kubernetes-opentelemetry/NodePodCapacity.yaml
@@ -9,7 +9,7 @@ type: STATIC
 
 # NRQL query
 nrql:
-  query: "FROM Metric select filter(uniqueCount(k8s.pod.name), where phase = 'Running' AND (metricName = 'kube_pod_status_phase' AND kube_pod_status_phase ['latest'] = 1) and created_by_kind != 'Job' ) / filter(latest(kube_node_status_allocatable), WHERE resource = 'cpu' ) * 100 as 'Pod Capacity %' where k8s.node.name != '' and k8s.node.name is not null and k8s.cluster.name in ('YOUR_CLUSTER_NAME') facet k8s.node.name, k8s.cluster.name"
+  query: "FROM Metric select filter(uniqueCount(k8s.pod.name), where phase = 'Running' AND (metricName = 'kube_pod_status_phase' AND kube_pod_status_phase ['latest'] = 1) and created_by_kind != 'Job' ) / filter(latest(kube_node_status_allocatable), WHERE resource = 'pods' ) * 100 as 'Pod Capacity %' where k8s.cluster.name in ('YOUR_CLUSTER_NAME')"
 
 # Direction in which baseline is set (Default: LOWER_ONLY)
 # baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY
diff --git a/alert-policies/kubernetes-opentelemetry/PodsFailingNamespace.yaml b/alert-policies/kubernetes-opentelemetry/PodsFailingNamespace.yaml
index e8926f955c..17ad1daaef 100644
--- a/alert-policies/kubernetes-opentelemetry/PodsFailingNamespace.yaml
+++ b/alert-policies/kubernetes-opentelemetry/PodsFailingNamespace.yaml
@@ -23,7 +23,7 @@ terms:
     # Operator used to compare against the threshold.
     operator: ABOVE
     # Value that triggers a violation
-    threshold: 0
+    threshold: 5
     # Time in seconds; 120 - 3600, must be a multiple of 60 for Baseline conditions
     thresholdDuration: 300
     # How many data points must be in violation for the duration
diff --git a/alert-policies/kubernetes-opentelemetry/StatefulsetPodsMissing.yaml b/alert-policies/kubernetes-opentelemetry/StatefulsetPodsMissing.yaml
index 7452575bb6..0e666bae6c 100644
--- a/alert-policies/kubernetes-opentelemetry/StatefulsetPodsMissing.yaml
+++ b/alert-policies/kubernetes-opentelemetry/StatefulsetPodsMissing.yaml
@@ -9,7 +9,7 @@ type: STATIC
 
 # NRQL query
 nrql:
-  query: "from Metric latest(kube_statefulset_replicas) - latest(kube_statefulset_status_replicas_ready) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') facet k8s.statefulset.name, k8s.namespace.name, k8s.cluster.name"
+  query: "from Metric select latest(kube_statefulset_replicas) - latest(kube_statefulset_status_replicas_ready) where k8s.cluster.name in ('YOUR_CLUSTER_NAME') and k8s.namespace.name in ('YOUR_NAMESPACE_NAME') facet k8s.statefulset.name, k8s.namespace.name, k8s.cluster.name"
 
 # Direction in which baseline is set (Default: LOWER_ONLY)
 # baselineDirection: LOWER_ONLY | UPPER_AND_LOWER | UPPER_ONLY

From 949697005e84bfb4e120b226bba593b1a1fa2918 Mon Sep 17 00:00:00 2001
From: rossfromwork <150628820+rossfromwork@users.noreply.github.com>
Date: Tue, 15 Oct 2024 20:16:13 +1100
Subject: [PATCH 06/10] Updated replication.master.slaves.Offset NRQL

Corrected NRQL used for Replication byte offset widget.

Changed from average(replication.master.slaves.Offset) to average('replication.master.slaves.Offset')
---
 dashboards/gcp-redis/gcp-redis.json | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/dashboards/gcp-redis/gcp-redis.json b/dashboards/gcp-redis/gcp-redis.json
index 4672c7c03e..3306d54db0 100644
--- a/dashboards/gcp-redis/gcp-redis.json
+++ b/dashboards/gcp-redis/gcp-redis.json
@@ -335,7 +335,7 @@
             "nrqlQueries": [
               {
                 "accountIds": [],
-                "query": "SELECT AVERAGE(replication.master.slaves.Offset) AS `Average Replication Byte Offset(Slaves)`, AVERAGE(replication.MasterReplOffset) AS `Average Replication Byte Offset(Master)` FROM GcpRedisInstanceSample WHERE (`provider` = 'GcpRedisInstance') FACET slave TIMESERIES AUTO"
+                "query": "SELECT AVERAGE('replication.master.slaves.Offset') AS `Average Replication Byte Offset(Slaves)`, AVERAGE(replication.MasterReplOffset) AS `Average Replication Byte Offset(Master)` FROM GcpRedisInstanceSample WHERE (`provider` = 'GcpRedisInstance') FACET slave TIMESERIES AUTO"
               }
             ],
             "platformOptions": {

From 4f54b21c51df0e3b837ba652c11056dc284ffc02 Mon Sep 17 00:00:00 2001
From: Doua Vue <dvue@newrelic.com>
Date: Tue, 15 Oct 2024 09:00:11 -0500
Subject: [PATCH 07/10] feat: Update k8s otel description

---
 .../kubernetes-opentelemetry/config.yml       | 63 +++++++++++--------
 1 file changed, 36 insertions(+), 27 deletions(-)

diff --git a/quickstarts/kubernetes-opentelemetry/config.yml b/quickstarts/kubernetes-opentelemetry/config.yml
index 2900593745..1a4e7592a1 100644
--- a/quickstarts/kubernetes-opentelemetry/config.yml
+++ b/quickstarts/kubernetes-opentelemetry/config.yml
@@ -1,43 +1,53 @@
 slug: kubernetes-opentelemetry
 title: Kubernetes (OpenTelemetry)
 description: |
-  ## Why monitor Kubernetes?
+  ## Why monitor Kubernetes using OpenTelemetry?
+  Kubernetes is an open-source system for automating deployment, scaling, and management of containerized applications.
+  OpenTelemetry is an open-source observability framework that provides IT teams with standardized protocols and tools for collecting and routing telemetry.
+  Organizations adopting OpenTelemetry will gain the advantage of vendor neutrality by using flexible and open-source agents and/or SDKs.
 
-  Kubernetes is an open-source system for automating deployment, scaling, and, management of containerized applications. The New Relic Kubernetes monitoring quickstart gives you visibility into your Kubernetes clusters and workloads in minutes, whether your clusters are hosted on-premises or in the cloud.
+  New Relic provides OpenTelemetry observability for Kubernetes which aims not only to ingest all the data sent but also to provide first-class K8s experiences and insights.
 
+  This quickstart gives you visibility into your Kubernetes clusters and workloads in minutes, whether your clusters are hosted on-premises or in the cloud.
   ### Kubernetes (OpenTelemetry) quickstart highlights
-
-  The New Relic Kubernetes quickstart uses dashboards to proactively monitor your metrics, like:
-
-  - resources used
-  - number of K8s objects
-  - namespaces per cluster
-  - pods by namespace
-  - container cpu usage
-  - container restarts
-  - missing pods by deployment
-  - node resource consumption, and more.
-
-  This quickstart is also compatible with on-host integrations like:
-
-  - Cassandra
-  - MySQL
-  - Apache, and more.
-
+  Included in this quickstart you will find:
+
+  * Instructions to install our [K8s instrumentation with OpenTelemetry](https://docs.newrelic.com/docs/kubernetes-pixie/kubernetes-integration/installation/k8s-otel/).
+  * A complete recommended alert policy including alert conditions to be notified on most of the common relevant issues.
+      * Container CPU throttling is high (alert condition)
+      * Container high CPU utilization (alert condition)
+      * Container high memory utilization (alert condition)
+      * Container is restarting (alert condition)
+      * Container is waiting (alert condition)
+      * Daemonset is missing pods (alert condition)
+      * Deployment is missing pods (alert condition)
+      * Etcd file descriptor utilization is high (alert condition)
+      * Etcd has no leader (alert condition)
+      * HPA current replicas < desired replicas (alert condition)
+      * HPA has reached maximum replicas (alert condition)
+      * Job Failed (alert condition)
+      * More than 5 pods failing in namespace (alert condition)
+      * Node allocatable CPU utilization is high (alert condition)
+      * Node allocatable memory utilization is high (alert condition)
+      * Node is not ready (alert condition)
+      * Node is unschedulable (alert condition)
+      * Node pod count nearing capacity (alert condition)
+      * Node root file system capacity utilization is high (alert condition)
+      * Persistent volume has errors (alert condition)
+      * Pod cannot be scheduled (alert condition)
+      * Pod is not ready (alert condition)
+      * Statefulset is missing pods (alert condition)
   ### New Relic + Kubernetes = Optimum performance monitoring
-
-  The [New Relic Kubernetes (OpenTelemetry)](https://docs.newrelic.com/docs/integrations/kubernetes-integration/installation/kubernetes-integration-install-configure/) quickstart has multiple components that work together to give you end-to-end observability across your clusters. While you have the flexibility to deploy the components that you prefer, to achieve full observability, you need to install the complete package to monitor all metrics. Use our quickstart to generate a Kubernetes manifest and add Pixie for more fine-grained telemetry data. You can also do the installation with Pixie for fine-grained telemetry data.
-  Our quickstart monitors the aggregated core and memory usage across all nodes in your cluster. This allows you to meet resource requirements for optimal application performance. It also empowers you to track resource consumption, find pods that aren't running, monitor disk usage, and troubleshoot container restarts. The New Relic Kubernetes integration has dashboards and a cluster explorer that provide a multi-dimensional representation of a Kubernetes cluster from which you can explore your namespaces, deployments, nodes, pods, containers, and applications. Download the New Relic Kubernetes quickstart today to gain instant visibility into your Kubernetes services, clusters and workloads in minutes.
 summary: |
-  Monitoring Kubernetes is crucial to gain instant visibility into Kubernetes clusters and workloads. Download New Relic Kubernetes quickstart to proactively monitor Kubernetes cluster health and capacity.
+  Monitoring Kubernetes with OpenTelemetry is crucial to gain instant visibility into Kubernetes clusters and workloads using open-source agents which provide vendor neutrality.
+
 level: New Relic
 authors:
   - New Relic
 documentation:
   - name: Kubernetes (Opentelemetry) installation docs
     description: |
-      Kubernetes is an open-source container-orchestration system for automating
-      computer application deployment, scaling, and management.
+      OpenTelemetry observability for Kubernetes provides a complete, open-source setup paired with a top-notch Kubernetes UI that is already compatible with our proprietary Kubernetes instrumentation. Our K8s UIs are designed to be provider agnostic, allowing you to select either OpenTelemetry or New Relic instrumentation based on your needs.
     url: >-
       https://docs.newrelic.com/docs/kubernetes-pixie/kubernetes-integration/installation/k8s-otel/#install
 dataSourceIds:
@@ -45,7 +55,6 @@ dataSourceIds:
 keywords:
   - kubernetes
   - containers
-  - pixie
   - k8s
   - opentelemetry
 alertPolicies:

From 5439de35a07d9bf455e380339786d237497115fe Mon Sep 17 00:00:00 2001
From: Doua Vue <dvue@newrelic.com>
Date: Wed, 16 Oct 2024 09:00:35 -0500
Subject: [PATCH 08/10] fix: Add icon key/value

---
 quickstarts/kubernetes-opentelemetry/config.yml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/quickstarts/kubernetes-opentelemetry/config.yml b/quickstarts/kubernetes-opentelemetry/config.yml
index 1a4e7592a1..ef24cee69f 100644
--- a/quickstarts/kubernetes-opentelemetry/config.yml
+++ b/quickstarts/kubernetes-opentelemetry/config.yml
@@ -41,6 +41,7 @@ description: |
 summary: |
   Monitoring Kubernetes with OpenTelemetry is crucial to gain instant visibility into Kubernetes clusters and workloads using open-source agents which provide vendor neutrality.
 
+icon: logo.svg
 level: New Relic
 authors:
   - New Relic

From 12115d369d60fa177a00b35ce35e28e0e12191ae Mon Sep 17 00:00:00 2001
From: nr-opensource-bot <opensource+bot@newrelic.com>
Date: Thu, 17 Oct 2024 18:36:01 +0000
Subject: [PATCH 09/10] chore: generate UUID(s) [skip ci]

---
 quickstarts/kubernetes-opentelemetry/config.yml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/quickstarts/kubernetes-opentelemetry/config.yml b/quickstarts/kubernetes-opentelemetry/config.yml
index ef24cee69f..aa9eed87af 100644
--- a/quickstarts/kubernetes-opentelemetry/config.yml
+++ b/quickstarts/kubernetes-opentelemetry/config.yml
@@ -1,3 +1,4 @@
+id: 7cc82a78-e523-4d35-bba9-aee81029d0f7
 slug: kubernetes-opentelemetry
 title: Kubernetes (OpenTelemetry)
 description: |

From 599132fb10bd7f3ed19023e69d7ee1dd3b19b87d Mon Sep 17 00:00:00 2001
From: Michel Losier <mlosier@newrelic.com>
Date: Thu, 17 Oct 2024 11:48:17 -0700
Subject: [PATCH 10/10] triggering the build