Skip to content

Commit ee02966

Browse files
authored
Merge pull request #91 from arangodb/tracking-terminations
Tracking recent pod terminations
2 parents d8d590c + fbc0d1b commit ee02966

File tree

6 files changed

+112
-1
lines changed

6 files changed

+112
-1
lines changed

pkg/apis/deployment/v1alpha/member_status.go

Lines changed: 42 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,12 @@
2222

2323
package v1alpha
2424

25+
import (
26+
"time"
27+
28+
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
29+
)
30+
2531
// MemberStatus holds the current status of a single member (server)
2632
type MemberStatus struct {
2733
// ID holds the unique ID of the member.
@@ -35,4 +41,40 @@ type MemberStatus struct {
3541
PodName string `json:"podName,omitempty"`
3642
// Conditions specific to this member
3743
Conditions ConditionList `json:"conditions,omitempty"`
44+
// RecentTerminations holds the times when this member was recently terminated.
45+
// First entry is the oldest. (do not add omitempty, since we want to be able to switch from a list to an empty list)
46+
RecentTerminations []metav1.Time `json:"recent-terminations"`
47+
}
48+
49+
// RemoveTerminationsBefore removes all recent terminations before the given timestamp.
50+
// It returns the number of terminations that have been removed.
51+
func (s *MemberStatus) RemoveTerminationsBefore(timestamp time.Time) int {
52+
removed := 0
53+
for {
54+
if len(s.RecentTerminations) == 0 {
55+
// Nothing left
56+
return removed
57+
}
58+
if s.RecentTerminations[0].Time.Before(timestamp) {
59+
// Let's remove it
60+
s.RecentTerminations = s.RecentTerminations[1:]
61+
removed++
62+
} else {
63+
// First (oldest) is not before given timestamp, we're done
64+
return removed
65+
}
66+
}
67+
}
68+
69+
// RecentTerminationsSince returns the number of terminations since the given timestamp.
70+
func (s MemberStatus) RecentTerminationsSince(timestamp time.Time) int {
71+
count := 0
72+
for idx := len(s.RecentTerminations) - 1; idx >= 0; idx-- {
73+
if s.RecentTerminations[idx].Time.Before(timestamp) {
74+
// This termination is before the timestamp, so we're done
75+
return count
76+
}
77+
count++
78+
}
79+
return count
3880
}
Lines changed: 53 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,53 @@
1+
//
2+
// DISCLAIMER
3+
//
4+
// Copyright 2018 ArangoDB GmbH, Cologne, Germany
5+
//
6+
// Licensed under the Apache License, Version 2.0 (the "License");
7+
// you may not use this file except in compliance with the License.
8+
// You may obtain a copy of the License at
9+
//
10+
// http://www.apache.org/licenses/LICENSE-2.0
11+
//
12+
// Unless required by applicable law or agreed to in writing, software
13+
// distributed under the License is distributed on an "AS IS" BASIS,
14+
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15+
// See the License for the specific language governing permissions and
16+
// limitations under the License.
17+
//
18+
// Copyright holder is ArangoDB GmbH, Cologne, Germany
19+
//
20+
// Author Ewout Prangsma
21+
//
22+
23+
package v1alpha
24+
25+
import (
26+
"testing"
27+
"time"
28+
29+
"github.com/stretchr/testify/assert"
30+
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
31+
)
32+
33+
// TestMemberStatusRecentTerminations tests the functions related to MemberStatus.RecentTerminations.
34+
func TestMemberStatusRecentTerminations(t *testing.T) {
35+
relTime := func(delta time.Duration) metav1.Time {
36+
return metav1.Time{Time: time.Now().Add(delta)}
37+
}
38+
39+
s := MemberStatus{}
40+
assert.Equal(t, 0, s.RecentTerminationsSince(time.Now().Add(-time.Hour)))
41+
assert.Equal(t, 0, s.RemoveTerminationsBefore(time.Now()))
42+
43+
s.RecentTerminations = []metav1.Time{metav1.Now()}
44+
assert.Equal(t, 1, s.RecentTerminationsSince(time.Now().Add(-time.Minute)))
45+
assert.Equal(t, 0, s.RecentTerminationsSince(time.Now().Add(time.Minute)))
46+
assert.Equal(t, 0, s.RemoveTerminationsBefore(time.Now().Add(-time.Hour)))
47+
48+
s.RecentTerminations = []metav1.Time{relTime(-time.Hour), relTime(-time.Minute), relTime(time.Minute)}
49+
assert.Equal(t, 3, s.RecentTerminationsSince(time.Now().Add(-time.Hour*2)))
50+
assert.Equal(t, 2, s.RecentTerminationsSince(time.Now().Add(-time.Minute*2)))
51+
assert.Equal(t, 2, s.RemoveTerminationsBefore(time.Now()))
52+
assert.Len(t, s.RecentTerminations, 1)
53+
}

pkg/apis/deployment/v1alpha/zz_generated.deepcopy.go

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -371,6 +371,13 @@ func (in *MemberStatus) DeepCopyInto(out *MemberStatus) {
371371
(*in)[i].DeepCopyInto(&(*out)[i])
372372
}
373373
}
374+
if in.RecentTerminations != nil {
375+
in, out := &in.RecentTerminations, &out.RecentTerminations
376+
*out = make([]v1.Time, len(*in))
377+
for i := range *in {
378+
(*in)[i].DeepCopyInto(&(*out)[i])
379+
}
380+
}
374381
return
375382
}
376383

pkg/deployment/reconcile/action_rotate_member.go

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -110,6 +110,7 @@ func (a *actionRotateMember) CheckProgress(ctx context.Context) (bool, error) {
110110
}
111111
// Pod is now gone, update the member status
112112
m.State = api.MemberStateNone
113+
m.RecentTerminations = nil // Since we're rotating, we do not care about old terminations.
113114
if err := a.actionCtx.UpdateMember(m); err != nil {
114115
return false, maskAny(err)
115116
}

pkg/deployment/reconcile/action_upgrade_member.go

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -120,6 +120,7 @@ func (a *actionUpgradeMember) CheckProgress(ctx context.Context) (bool, error) {
120120
}
121121
// Pod is now gone, update the member status
122122
m.State = api.MemberStateNone
123+
m.RecentTerminations = nil // Since we're upgrading, we do not care about old terminations.
123124
if err := a.actionCtx.UpdateMember(m); err != nil {
124125
return false, maskAny(err)
125126
}

pkg/deployment/resources/pod_inspector.go

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -26,11 +26,12 @@ import (
2626
"fmt"
2727
"time"
2828

29-
"github.com/arangodb/kube-arangodb/pkg/util/k8sutil"
3029
"k8s.io/api/core/v1"
30+
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
3131

3232
api "github.com/arangodb/kube-arangodb/pkg/apis/deployment/v1alpha"
3333
"github.com/arangodb/kube-arangodb/pkg/metrics"
34+
"github.com/arangodb/kube-arangodb/pkg/util/k8sutil"
3435
)
3536

3637
var (
@@ -81,12 +82,18 @@ func (r *Resources) InspectPods() error {
8182
if memberStatus.Conditions.Update(api.ConditionTypeTerminated, true, "Pod Succeeded", "") {
8283
log.Debug().Str("pod-name", p.GetName()).Msg("Updating member condition Terminated to true: Pod Succeeded")
8384
updateMemberStatusNeeded = true
85+
// Record termination time
86+
now := metav1.Now()
87+
memberStatus.RecentTerminations = append(memberStatus.RecentTerminations, now)
8488
}
8589
} else if k8sutil.IsPodFailed(&p) {
8690
// Pod has terminated with at least 1 container with a non-zero exit code.
8791
if memberStatus.Conditions.Update(api.ConditionTypeTerminated, true, "Pod Failed", "") {
8892
log.Debug().Str("pod-name", p.GetName()).Msg("Updating member condition Terminated to true: Pod Failed")
8993
updateMemberStatusNeeded = true
94+
// Record termination time
95+
now := metav1.Now()
96+
memberStatus.RecentTerminations = append(memberStatus.RecentTerminations, now)
9097
}
9198
}
9299
if k8sutil.IsPodReady(&p) {

0 commit comments

Comments
 (0)