Skip to content

Commit

Permalink
Don't remove controlnode from cluster too early (#887)
Browse files Browse the repository at this point in the history
Signed-off-by: Alexey Makhov <amakhov@mirantis.com>
  • Loading branch information
makhov authored Jan 16, 2025
1 parent c6dc757 commit a845ab3
Show file tree
Hide file tree
Showing 2 changed files with 45 additions and 4 deletions.
38 changes: 38 additions & 0 deletions internal/controller/controlplane/helper.go
Original file line number Diff line number Diff line change
Expand Up @@ -344,6 +344,44 @@ func (c *K0sController) markChildControlNodeToLeave(ctx context.Context, name st
return nil
}

// deleteOldControlNodes deletes ControlNode objects in the workload cluster
// whose names do not match any control plane machine of the given cluster.
//
// It lists the cluster's control plane machines, fetches all ControlNodes from
// the autopilot.k0sproject.io/v1beta2 endpoint and calls deleteControlNode for
// every ControlNode that has no machine with the same name. A NotFound response
// from the list request is tolerated; the list then stays empty and nothing is
// deleted.
//
// The first error encountered is returned (wrapped); ControlNodes that come
// later in the list are not processed in that case.
func (c *K0sController) deleteOldControlNodes(ctx context.Context, cluster *clusterv1.Cluster) error {
	kubeClient, err := c.getKubeClient(ctx, cluster)
	if err != nil {
		return fmt.Errorf("error getting kube client: %w", err)
	}
	// deleteControlNode treats a nil clientset as a no-op; mirror that here
	// rather than dereferencing a nil client below.
	if kubeClient == nil {
		return nil
	}

	machines, err := collections.GetFilteredMachinesForCluster(ctx, c, cluster, collections.ControlPlaneMachines(cluster.Name))
	if err != nil {
		return fmt.Errorf("error getting all machines: %w", err)
	}

	var controlNodeList unstructured.UnstructuredList
	err = kubeClient.RESTClient().
		Get().
		AbsPath("/apis/autopilot.k0sproject.io/v1beta2/controlnodes").
		Do(ctx).
		Into(&controlNodeList)
	if err != nil && !apierrors.IsNotFound(err) {
		return fmt.Errorf("error listing controlnodes: %w", err)
	}

	// Set of machine names, used to decide which ControlNodes are still wanted.
	machineNames := machines.Names()
	existingMachineNames := make(map[string]struct{}, len(machineNames))
	for _, n := range machineNames {
		existingMachineNames[n] = struct{}{}
	}

	for _, controlNode := range controlNodeList.Items {
		name := controlNode.GetName()
		if _, ok := existingMachineNames[name]; ok {
			continue
		}
		if err := c.deleteControlNode(ctx, name, kubeClient); err != nil {
			return fmt.Errorf("error deleting controlnode %q: %w", name, err)
		}
	}

	return nil
}

func (c *K0sController) deleteControlNode(ctx context.Context, name string, clientset *kubernetes.Clientset) error {
if clientset == nil {
return nil
Expand Down
11 changes: 7 additions & 4 deletions internal/controller/controlplane/k0s_controlplane_controller.go
Original file line number Diff line number Diff line change
Expand Up @@ -373,6 +373,13 @@ func (c *K0sController) reconcileMachines(ctx context.Context, cluster *clusterv
}
log.Log.Info("Collected machines", "count", machines.Len(), "desired", kcp.Spec.Replicas, "updating", clusterIsUpdating, "deleting", len(machineNamesToDelete), "desiredMachines", desiredMachineNames)

// Delete stale ControlNodes in a separate goroutine. The error is kept local
// to the goroutine: assigning to the enclosing function's err from here would
// be a data race with the code that continues to use that variable.
go func() {
	if err := c.deleteOldControlNodes(ctx, cluster); err != nil {
		logger.Error(err, "Error deleting old control nodes")
	}
}()

if clusterIsUpdating {
log.Log.Info("Cluster is updating", "currentVersion", currentVersion, "newVersion", kcp.Spec.Version, "strategy", kcp.Spec.UpdateStrategy)
if kcp.Spec.UpdateStrategy == cpv1beta1.UpdateRecreate {
Expand Down Expand Up @@ -499,10 +506,6 @@ func (c *K0sController) runMachineDeletionSequence(ctx context.Context, logger l
return fmt.Errorf("error checking machine left: %w", err)
}

if err := c.deleteControlNode(ctx, machine.Name, kubeClient); err != nil {
return fmt.Errorf("error deleting controlnode: %w", err)
}

if err := c.deleteBootstrapConfig(ctx, machine.Name, kcp); err != nil {
return fmt.Errorf("error deleting machine from template: %w", err)
}
Expand Down

0 comments on commit a845ab3

Please sign in to comment.