From 24dcb4e4ae2ca92579b72056611f5395bd45fce0 Mon Sep 17 00:00:00 2001
From: Christian Schlotter
Date: Fri, 13 Dec 2024 11:07:37 +0100
Subject: [PATCH] vspherevm: don't requeue on deletenode when there is no ClusterCache connection

---
 controllers/vspherevm_controller.go | 21 +++++++++------------
 1 file changed, 9 insertions(+), 12 deletions(-)

diff --git a/controllers/vspherevm_controller.go b/controllers/vspherevm_controller.go
index 3f7e99c4eb..5a5dd0a89b 100644
--- a/controllers/vspherevm_controller.go
+++ b/controllers/vspherevm_controller.go
@@ -357,14 +357,10 @@ func (r vmReconciler) reconcileDelete(ctx context.Context, vmCtx *capvcontext.VM
 	}
 
 	// Attempt to delete the node corresponding to the vsphere VM
-	result, err = r.deleteNode(ctx, vmCtx, vm.Name)
+	err = r.deleteNode(ctx, vmCtx, vm.Name)
 	if err != nil {
 		log.Error(err, "Failed to delete Node (best-effort)")
 	}
-	if !result.IsZero() {
-		// a non-zero value means we need to requeue the request before proceed.
-		return result, nil
-	}
 
 	if err := r.deleteIPAddressClaims(ctx, vmCtx); err != nil {
 		return reconcile.Result{}, err
@@ -382,26 +378,27 @@ func (r vmReconciler) reconcileDelete(ctx context.Context, vmCtx *capvcontext.VM
 // This is necessary since CAPI does not surface the nodeRef field on the owner Machine object
 // until the node moves to Ready state. Hence, on Machine deletion it is unable to delete
 // the kubernetes node corresponding to the VM.
-func (r vmReconciler) deleteNode(ctx context.Context, vmCtx *capvcontext.VMContext, name string) (reconcile.Result, error) {
+// Note: If this fails, CPI normally cleans up orphaned nodes.
+func (r vmReconciler) deleteNode(ctx context.Context, vmCtx *capvcontext.VMContext, name string) error {
 	log := ctrl.LoggerFrom(ctx)
 	// Fetching the cluster object from the VSphereVM object to create a remote client to the cluster
 	cluster, err := clusterutilv1.GetClusterFromMetadata(ctx, r.Client, vmCtx.VSphereVM.ObjectMeta)
 	if err != nil {
-		return ctrl.Result{}, err
+		return err
 	}
 
 	// Skip deleting the Node if the cluster is being deleted.
 	if !cluster.DeletionTimestamp.IsZero() {
-		return ctrl.Result{}, nil
+		return nil
 	}
 
 	clusterClient, err := r.clusterCache.GetClient(ctx, ctrlclient.ObjectKeyFromObject(cluster))
 	if err != nil {
 		if errors.Is(err, clustercache.ErrClusterNotConnected) {
-			log.V(5).Info("Requeuing because connection to the workload cluster is down")
-			return ctrl.Result{RequeueAfter: time.Minute}, nil
+			log.V(2).Info("Skipping node deletion because connection to the workload cluster is down")
+			return nil
 		}
-		return ctrl.Result{}, err
+		return err
 	}
 
 	// Attempt to delete the corresponding node
@@ -410,7 +407,7 @@ func (r vmReconciler) deleteNode(ctx context.Context, vmCtx *capvcontext.VMConte
 			Name: name,
 		},
 	}
-	return ctrl.Result{}, clusterClient.Delete(ctx, node)
+	return clusterClient.Delete(ctx, node)
 }
 
 func (r vmReconciler) reconcileNormal(ctx context.Context, vmCtx *capvcontext.VMContext) (reconcile.Result, error) {