From ddda8e1292e3011844864d66125221a4dc19e1cd Mon Sep 17 00:00:00 2001 From: Michael Burman Date: Thu, 27 Jun 2024 12:01:05 +0300 Subject: [PATCH] =?UTF-8?q?Add=20MinReadySeconds=20to=205=20in=20StatefulS?= =?UTF-8?q?ets=20to=20prevent=20sudden=20double=20res=E2=80=A6=20(#647)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * Add Spec.MinReadySeconds to allow setting a non-default value for MinReadySeconds in StatefulSets. Set the default MinReadySeconds to 5 in StatefulSets to prevent sudden double restarts from statefulset controller. * Modify unit test to ensure value is set * Add additional test that the change is actually applied --- CHANGELOG.md | 2 ++ .../v1beta1/cassandradatacenter_types.go | 4 +++ .../v1beta1/zz_generated.deepcopy.go | 5 +++ ...dra.datastax.com_cassandradatacenters.yaml | 6 ++++ pkg/reconciliation/construct_statefulset.go | 5 +++ .../construct_statefulset_test.go | 33 +++++++++++++++++++ 6 files changed, 55 insertions(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 519d786d..84aa0d47 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -11,6 +11,8 @@ Changelog for Cass Operator, new PRs should update the `main / unreleased` secti ## unreleased +* [ENHANCEMENT] [#648](https://github.com/k8ssandra/cass-operator/issues/648) Make MinReadySeconds configurable value in the Spec. + ## v1.21.1 * [BUGFIX] [#665](https://github.com/k8ssandra/cass-operator/issues/665) The RequiresUpdate and ObservedGenerations were updated too often, even when the reconcile was not finished. diff --git a/apis/cassandra/v1beta1/cassandradatacenter_types.go b/apis/cassandra/v1beta1/cassandradatacenter_types.go index fc4a76c4..35f27b36 100644 --- a/apis/cassandra/v1beta1/cassandradatacenter_types.go +++ b/apis/cassandra/v1beta1/cassandradatacenter_types.go @@ -258,6 +258,10 @@ type CassandraDatacenterSpec struct { // Use cautiously. 
// +optional DatacenterName string `json:"datacenterName,omitempty"` + + // MinReadySeconds sets the minimum number of seconds for which a newly created pod should be ready without any of its containers crashing, for it to be considered available. Defaults to 5 seconds and is set in the StatefulSet spec. + // Setting to 0 might cause multiple Cassandra pods to restart at the same time despite PodDisruptionBudget settings. + MinReadySeconds *int32 `json:"minReadySeconds,omitempty"` } type NetworkingConfig struct { diff --git a/apis/cassandra/v1beta1/zz_generated.deepcopy.go b/apis/cassandra/v1beta1/zz_generated.deepcopy.go index 63c077c8..ad4af351 100644 --- a/apis/cassandra/v1beta1/zz_generated.deepcopy.go +++ b/apis/cassandra/v1beta1/zz_generated.deepcopy.go @@ -357,6 +357,11 @@ func (in *CassandraDatacenterSpec) DeepCopyInto(out *CassandraDatacenterSpec) { *out = new(CDCConfiguration) (*in).DeepCopyInto(*out) } + if in.MinReadySeconds != nil { + in, out := &in.MinReadySeconds, &out.MinReadySeconds + *out = new(int32) + **out = **in + } } // DeepCopy is an autogenerated deepcopy function, copying the receiver, creating a new CassandraDatacenterSpec. diff --git a/config/crd/bases/cassandra.datastax.com_cassandradatacenters.yaml b/config/crd/bases/cassandra.datastax.com_cassandradatacenters.yaml index 65605344..74558566 100644 --- a/config/crd/bases/cassandra.datastax.com_cassandradatacenters.yaml +++ b/config/crd/bases/cassandra.datastax.com_cassandradatacenters.yaml @@ -348,6 +348,12 @@ spec: - serverSecretName type: object type: object + minReadySeconds: + description: |- + MinReadySeconds sets the minimum number of seconds for which a newly created pod should be ready without any of its containers crashing, for it to be considered available. Defaults to 5 seconds and is set in the StatefulSet spec. + Setting to 0 might cause multiple Cassandra pods to restart at the same time despite PodDisruptionBudget settings. 
+ format: int32 + type: integer networking: properties: hostNetwork: diff --git a/pkg/reconciliation/construct_statefulset.go b/pkg/reconciliation/construct_statefulset.go index a9b1ca81..f9227710 100644 --- a/pkg/reconciliation/construct_statefulset.go +++ b/pkg/reconciliation/construct_statefulset.go @@ -145,6 +145,7 @@ func newStatefulSetForCassandraDatacenter( PodManagementPolicy: appsv1.ParallelPodManagement, Template: *template, VolumeClaimTemplates: volumeClaimTemplates, + MinReadySeconds: 5, }, } @@ -169,6 +170,10 @@ func newStatefulSetForCassandraDatacenter( result.Spec.UpdateStrategy = strategy } + if dc.Spec.MinReadySeconds != nil { + result.Spec.MinReadySeconds = *dc.Spec.MinReadySeconds + } + // add a hash here to facilitate checking if updates are needed utils.AddHashAnnotation(result) diff --git a/pkg/reconciliation/construct_statefulset_test.go b/pkg/reconciliation/construct_statefulset_test.go index 3db9d14e..45e02997 100644 --- a/pkg/reconciliation/construct_statefulset_test.go +++ b/pkg/reconciliation/construct_statefulset_test.go @@ -420,6 +420,7 @@ func Test_newStatefulSetForCassandraDatacenterWithAdditionalVolumes(t *testing.T assert.Equal(t, 1, len(got.Spec.Template.Spec.InitContainers[1].VolumeMounts)) assert.Equal(t, "server-config", got.Spec.Template.Spec.InitContainers[1].VolumeMounts[0].Name) assert.Equal(t, "/config", got.Spec.Template.Spec.InitContainers[1].VolumeMounts[0].MountPath) + assert.Equal(t, int32(5), got.Spec.MinReadySeconds) } } @@ -711,3 +712,35 @@ func TestPodTemplateSpecHashAnnotationChanges(t *testing.T) { updatedHash = sts.Annotations[utils.ResourceHashAnnotationKey] assert.NotEqual(currentHash, updatedHash, "expected hash to change when PodTemplateSpec labels change") } + +func TestMinReadySecondsChange(t *testing.T) { + assert := assert.New(t) + dc := &api.CassandraDatacenter{ + Spec: api.CassandraDatacenterSpec{ + ClusterName: "test", + ServerType: "cassandra", + ServerVersion: "4.0.7", + StorageConfig: 
api.StorageConfig{ + CassandraDataVolumeClaimSpec: &corev1.PersistentVolumeClaimSpec{}, + }, + Racks: []api.Rack{ + { + Name: "testrack", + }, + }, + PodTemplateSpec: &corev1.PodTemplateSpec{}, + }, + } + + sts, err := newStatefulSetForCassandraDatacenter(nil, dc.Spec.Racks[0].Name, dc, 3) + assert.NoError(err, "failed to build statefulset") + + assert.Equal(int32(5), sts.Spec.MinReadySeconds) + + dc.Spec.MinReadySeconds = ptr.To[int32](10) + + sts, err = newStatefulSetForCassandraDatacenter(nil, dc.Spec.Racks[0].Name, dc, 3) + assert.NoError(err, "failed to build statefulset") + + assert.Equal(int32(10), sts.Spec.MinReadySeconds) +}