Skip to content

Commit

Permalink
feat: add resourceDiscovery status condition (#223)
Browse files Browse the repository at this point in the history
* feat: add resourceDiscovery status condition

The ResourceSelector field in a MonitoringStack CR can be set to nil.
This is passed on to the Prometheus CR and can be used to disable all
service discovery and thus most scraping (we add prometheus and
alertmanager scrape jobs via additionalScrapeConfigs).
When this is configured we now set a new status condition to alert users
to the fact that no service discovery is configured.

Fixes: https://issues.redhat.com/browse/MON-2864

* refactor: updateConditions should update previously not existing conditions

Problem: Before this commit only an empty Conditions list would initialize all
conditions. This means that if the controller gets updated to report a
new conditions and existing MonitoringStack CR would not report that new
conditions until its recreated.

Fix: Update all conditions independently of the previously reported
conditions.

Signed-off-by: Jan Fajerski <jfajersk@redhat.com>
  • Loading branch information
jan--f committed Dec 21, 2022
1 parent bc3b0d2 commit 1ea726d
Show file tree
Hide file tree
Showing 9 changed files with 333 additions and 202 deletions.
5 changes: 4 additions & 1 deletion bundle/manifests/monitoring.rhobs_monitoringstacks.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -835,7 +835,10 @@ spec:
type: integer
type: object
resourceSelector:
description: Label selector for Monitoring Stack Resources.
description: Label selector for Monitoring Stack Resources. Set to
the empty LabelSelector ({}) to monitoring everything. Set to null
to disable service discovery.
nullable: true
properties:
matchExpressions:
description: matchExpressions is a list of label selector requirements.
Expand Down
5 changes: 4 additions & 1 deletion deploy/crds/common/monitoring.rhobs_monitoringstacks.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -836,7 +836,10 @@ spec:
type: integer
type: object
resourceSelector:
description: Label selector for Monitoring Stack Resources.
description: Label selector for Monitoring Stack Resources. Set to
the empty LabelSelector ({}) to monitoring everything. Set to null
to disable service discovery.
nullable: true
properties:
matchExpressions:
description: matchExpressions is a list of label selector requirements.
Expand Down
4 changes: 2 additions & 2 deletions docs/api.md
Original file line number Diff line number Diff line change
Expand Up @@ -124,7 +124,7 @@ MonitoringStackSpec is the specification for desired Monitoring Stack
<td><b><a href="#monitoringstackspecresourceselector">resourceSelector</a></b></td>
<td>object</td>
<td>
Label selector for Monitoring Stack Resources.<br/>
Label selector for Monitoring Stack Resources. Set to the empty LabelSelector ({}) to monitoring everything. Set to null to disable service discovery.<br/>
</td>
<td>false</td>
</tr><tr>
Expand Down Expand Up @@ -1803,7 +1803,7 @@ RelabelConfig allows dynamic rewriting of the label set, being applied to sample



Label selector for Monitoring Stack Resources.
Label selector for Monitoring Stack Resources. Set to the empty LabelSelector ({}) to monitoring everything. Set to null to disable service discovery.

<table>
<thead>
Expand Down
10 changes: 7 additions & 3 deletions pkg/apis/monitoring/v1alpha1/types.go
Original file line number Diff line number Diff line change
Expand Up @@ -58,8 +58,11 @@ type MonitoringStackSpec struct {
LogLevel LogLevel `json:"logLevel,omitempty"`

// Label selector for Monitoring Stack Resources.
// Set to the empty LabelSelector ({}) to monitoring everything.
// Set to null to disable service discovery.
// +optional
ResourceSelector *metav1.LabelSelector `json:"resourceSelector,omitempty"`
// +nullable
ResourceSelector *metav1.LabelSelector `json:"resourceSelector"`

// Namespace selector for Monitoring Stack Resources.
// If left empty the Monitoring Stack will only match resources in the namespace it was created in.
Expand Down Expand Up @@ -108,8 +111,9 @@ const (
ConditionFalse ConditionStatus = "False"
ConditionUnknown ConditionStatus = "Unknown"

ReconciledCondition ConditionType = "Reconciled"
AvailableCondition ConditionType = "Available"
ReconciledCondition ConditionType = "Reconciled"
AvailableCondition ConditionType = "Available"
ResourceDiscoveryCondition ConditionType = "ResourceDiscovery"
)

type Condition struct {
Expand Down
3 changes: 0 additions & 3 deletions pkg/controllers/monitoring/monitoring-stack/components.go
Original file line number Diff line number Diff line change
Expand Up @@ -108,9 +108,6 @@ func newPrometheus(
instanceSelectorValue string,
) *monv1.Prometheus {
prometheusSelector := ms.Spec.ResourceSelector
if prometheusSelector == nil {
prometheusSelector = &metav1.LabelSelector{}
}

config := ms.Spec.PrometheusConfig

Expand Down
110 changes: 71 additions & 39 deletions pkg/controllers/monitoring/monitoring-stack/conditions.go
Original file line number Diff line number Diff line change
Expand Up @@ -15,60 +15,78 @@ const (
PrometheusNotAvailable = "PrometheusNotAvailable"
PrometheusNotReconciled = "PrometheusNotReconciled"
PrometheusDegraded = "PrometheusDegraded"
ResourceSelectorIsNil = "ResourceSelectorNil"
CannotReadPrometheusConditions = "Cannot read Prometheus status conditions"
AvailableMessage = "Monitoring Stack is available"
SuccessfullyReconciledMessage = "Monitoring Stack is successfully reconciled"
ResourceSelectorIsNilMessage = "No resources will be discovered, ResourceSelector is nil"
ResourceDiscoveryOnMessage = "Resource discovery is operational"
NoReason = "None"
)

func updateConditions(msConditions []v1alpha1.Condition, prom monv1.Prometheus, generation int64, recError error) []v1alpha1.Condition {
if len(msConditions) == 0 {
return []v1alpha1.Condition{
{
Type: v1alpha1.AvailableCondition,
Status: v1alpha1.ConditionUnknown,
Reason: NoReason,
LastTransitionTime: metav1.Now(),
},
{
Type: v1alpha1.ReconciledCondition,
Status: v1alpha1.ConditionUnknown,
Reason: NoReason,
LastTransitionTime: metav1.Now(),
},
func updateConditions(ms *v1alpha1.MonitoringStack, prom monv1.Prometheus, recError error) []v1alpha1.Condition {
return []v1alpha1.Condition{
updateResourceDiscovery(ms),
updateAvailable(ms.Status.Conditions, prom, ms.Generation),
updateReconciled(ms.Status.Conditions, prom, ms.Generation, recError),
}
}

func getMSCondition(conditions []v1alpha1.Condition, t v1alpha1.ConditionType) (v1alpha1.Condition, error) {
for _, c := range conditions {
if c.Type == t {
return c, nil
}
}
var updatedConditions []v1alpha1.Condition

for _, mc := range msConditions {
switch mc.Type {
case v1alpha1.AvailableCondition:
available := updateAvailable(mc, prom, generation)
if !available.Equal(mc) {
available.LastTransitionTime = metav1.Now()
}
updatedConditions = append(updatedConditions, available)
case v1alpha1.ReconciledCondition:
reconciled := updateReconciled(mc, prom, generation, recError)
if !reconciled.Equal(mc) {
reconciled.LastTransitionTime = metav1.Now()
}
updatedConditions = append(updatedConditions, reconciled)
return v1alpha1.Condition{}, fmt.Errorf("condition type %v not found", t)
}

// updateResourceDiscovery updates the ResourceDiscoveryCondition based on the
// ResourceSelector in the MonitorinStack spec. A ResourceSelector of nil causes
// the condition to be false, any other value sets the condition to true
func updateResourceDiscovery(ms *v1alpha1.MonitoringStack) v1alpha1.Condition {
if ms.Spec.ResourceSelector == nil {
return v1alpha1.Condition{
Type: v1alpha1.ResourceDiscoveryCondition,
Status: v1alpha1.ConditionFalse,
Reason: ResourceSelectorIsNil,
Message: ResourceSelectorIsNilMessage,
LastTransitionTime: metav1.Now(),
ObservedGeneration: ms.Generation,
}
} else {
return v1alpha1.Condition{
Type: v1alpha1.ResourceDiscoveryCondition,
Status: v1alpha1.ConditionTrue,
Reason: NoReason,
Message: ResourceDiscoveryOnMessage,
LastTransitionTime: metav1.Now(),
ObservedGeneration: ms.Generation,
}
}

return updatedConditions
}

// updateAvailable gets existing "Available" condition and updates its parameters
// based on the Prometheus "Available" condition
func updateAvailable(ac v1alpha1.Condition, prom monv1.Prometheus, generation int64) v1alpha1.Condition {
func updateAvailable(conditions []v1alpha1.Condition, prom monv1.Prometheus, generation int64) v1alpha1.Condition {
ac, err := getMSCondition(conditions, v1alpha1.AvailableCondition)
if err != nil {
ac = v1alpha1.Condition{
Type: v1alpha1.AvailableCondition,
Status: v1alpha1.ConditionUnknown,
Reason: NoReason,
LastTransitionTime: metav1.Now(),
}
}

prometheusAvailable, err := getPrometheusCondition(prom.Status.Conditions, monv1.PrometheusAvailable)

if err != nil {
ac.Status = v1alpha1.ConditionUnknown
ac.Reason = PrometheusNotAvailable
ac.Message = CannotReadPrometheusConditions
ac.LastTransitionTime = metav1.Now()
return ac
}
// MonitoringStack status will not be updated if there is a difference between the Prometheus generation
Expand All @@ -85,31 +103,43 @@ func updateAvailable(ac v1alpha1.Condition, prom monv1.Prometheus, generation in
ac.Reason = PrometheusNotAvailable
}
ac.Message = prometheusAvailable.Message
ac.LastTransitionTime = metav1.Now()
return ac
}
ac.Status = v1alpha1.ConditionTrue
ac.Reason = AvailableReason
ac.Message = AvailableMessage
ac.ObservedGeneration = generation
ac.LastTransitionTime = metav1.Now()
return ac
}

// updateReconciled updates "Reconciled" conditions based on the provided error value and
// Prometheus "Reconciled" condition
func updateReconciled(rc v1alpha1.Condition, prom monv1.Prometheus, generation int64, err error) v1alpha1.Condition {

if err != nil {
func updateReconciled(conditions []v1alpha1.Condition, prom monv1.Prometheus, generation int64, reconcileErr error) v1alpha1.Condition {
rc, cErr := getMSCondition(conditions, v1alpha1.ReconciledCondition)
if cErr != nil {
rc = v1alpha1.Condition{
Type: v1alpha1.ReconciledCondition,
Status: v1alpha1.ConditionUnknown,
Reason: NoReason,
LastTransitionTime: metav1.Now(),
}
}
if reconcileErr != nil {
rc.Status = v1alpha1.ConditionFalse
rc.Message = err.Error()
rc.Message = reconcileErr.Error()
rc.Reason = FailedToReconcileReason
rc.LastTransitionTime = metav1.Now()
return rc
}
prometheusReconciled, err := getPrometheusCondition(prom.Status.Conditions, monv1.PrometheusReconciled)
prometheusReconciled, reconcileErr := getPrometheusCondition(prom.Status.Conditions, monv1.PrometheusReconciled)

if err != nil {
if reconcileErr != nil {
rc.Status = v1alpha1.ConditionUnknown
rc.Reason = PrometheusNotReconciled
rc.Message = CannotReadPrometheusConditions
rc.LastTransitionTime = metav1.Now()
return rc
}

Expand All @@ -121,12 +151,14 @@ func updateReconciled(rc v1alpha1.Condition, prom monv1.Prometheus, generation i
rc.Status = prometheusStatusToMSStatus(prometheusReconciled.Status)
rc.Reason = PrometheusNotReconciled
rc.Message = prometheusReconciled.Message
rc.LastTransitionTime = metav1.Now()
return rc
}
rc.Status = v1alpha1.ConditionTrue
rc.Reason = ReconciledReason
rc.Message = SuccessfullyReconciledMessage
rc.ObservedGeneration = generation
rc.LastTransitionTime = metav1.Now()
return rc
}

Expand Down
Loading

0 comments on commit 1ea726d

Please sign in to comment.