Skip to content

Commit 1af3b73

Browse files
zhangzujianoilbeater
authored andcommitted
gc: consider whether the sts pod is alive during lsp gc (#5122)
Signed-off-by: zhangzujian <[email protected]>
1 parent feea276 commit 1af3b73

File tree

2 files changed

+73
-12
lines changed

2 files changed

+73
-12
lines changed

pkg/controller/gc.go

+1-1
Original file line numberDiff line numberDiff line change
@@ -327,7 +327,7 @@ func (c *Controller) markAndCleanLSP() error {
327327
ipMap := strset.NewWithSize(len(pods) + len(nodes))
328328
for _, pod := range pods {
329329
if isStsPod, stsName, stsUID := isStatefulSetPod(pod); isStsPod {
330-
if isStatefulSetPodToDel(c.config.KubeClient, pod, stsName, stsUID) {
330+
if isStatefulSetPodToGC(c.config.KubeClient, pod, stsName, stsUID) {
331331
continue
332332
}
333333
} else if !isPodAlive(pod) {

pkg/controller/pod.go

+72-11
Original file line numberDiff line numberDiff line change
@@ -911,8 +911,8 @@ func (c *Controller) handleDeletePod(key string) (err error) {
911911

912912
var keepIPCR bool
913913
if ok, stsName, stsUID := isStatefulSetPod(pod); ok {
914-
if pod.DeletionTimestamp != nil {
915-
klog.Infof("handle deletion of sts pod %s", podName)
914+
if !pod.DeletionTimestamp.IsZero() {
915+
klog.Infof("handle deletion of sts pod %s", podKey)
916916
toDel := isStatefulSetPodToDel(c.config.KubeClient, pod, stsName, stsUID)
917917
if !toDel {
918918
klog.Infof("try keep ip for sts pod %s", podKey)
@@ -935,7 +935,7 @@ func (c *Controller) handleDeletePod(key string) (err error) {
935935
if isVMPod && c.config.EnableKeepVMIP {
936936
ports, err := c.OVNNbClient.ListNormalLogicalSwitchPorts(true, map[string]string{"pod": podKey})
937937
if err != nil {
938-
klog.Errorf("failed to list lsps of pod '%s', %v", pod.Name, err)
938+
klog.Errorf("failed to list lsps of pod %s: %v", podKey, err)
939939
return err
940940
}
941941
for _, port := range ports {
@@ -946,7 +946,7 @@ func (c *Controller) handleDeletePod(key string) (err error) {
946946
}
947947
}
948948
if pod.DeletionTimestamp != nil {
949-
klog.Infof("handle deletion of vm pod %s", podName)
949+
klog.Infof("handle deletion of vm pod %s", podKey)
950950
vmToBeDel := c.isVMToDel(pod, vmName)
951951
if !vmToBeDel {
952952
klog.Infof("try keep ip for vm pod %s", podKey)
@@ -968,12 +968,12 @@ func (c *Controller) handleDeletePod(key string) (err error) {
968968

969969
podNets, err := c.getPodKubeovnNets(pod)
970970
if err != nil {
971-
klog.Errorf("failed to get pod nets %v", err)
971+
klog.Errorf("failed to get kube-ovn nets of pod %s: %v", podKey, err)
972972
}
973973
if !keepIPCR {
974974
ports, err := c.OVNNbClient.ListNormalLogicalSwitchPorts(true, map[string]string{"pod": podKey})
975975
if err != nil {
976-
klog.Errorf("failed to list lsps of pod '%s', %v", pod.Name, err)
976+
klog.Errorf("failed to list lsps of pod %s: %v", podKey, err)
977977
return err
978978
}
979979

@@ -1259,16 +1259,20 @@ func isStatefulSetPodToDel(c kubernetes.Interface, pod *v1.Pod, statefulSetName
12591259
if err != nil {
12601260
// statefulset is deleted
12611261
if k8serrors.IsNotFound(err) {
1262-
klog.Infof("statefulset %s is deleted", statefulSetName)
1262+
klog.Infof("statefulset %s/%s has been deleted", pod.Namespace, statefulSetName)
12631263
return true
12641264
}
1265-
klog.Errorf("failed to get statefulset %v", err)
1265+
klog.Errorf("failed to get statefulset %s/%s: %v", pod.Namespace, statefulSetName, err)
12661266
return false
12671267
}
12681268

12691269
// statefulset is being deleted, or it's a newly created one
1270-
if !sts.DeletionTimestamp.IsZero() || sts.UID != statefulSetUID {
1271-
klog.Infof("statefulset %s is being deleted", statefulSetName)
1270+
if !sts.DeletionTimestamp.IsZero() {
1271+
klog.Infof("statefulset %s/%s is being deleted", pod.Namespace, statefulSetName)
1272+
return true
1273+
}
1274+
if sts.UID != statefulSetUID {
1275+
klog.Infof("statefulset %s/%s is a newly created one", pod.Namespace, statefulSetName)
12721276
return true
12731277
}
12741278

@@ -1286,9 +1290,66 @@ func isStatefulSetPodToDel(c kubernetes.Interface, pod *v1.Pod, statefulSetName
12861290
startOrdinal = int64(sts.Spec.Ordinals.Start)
12871291
}
12881292
if index >= startOrdinal+int64(*sts.Spec.Replicas) {
1289-
klog.Infof("statefulset %s is down scaled", statefulSetName)
1293+
klog.Infof("statefulset %s/%s is down scaled", pod.Namespace, statefulSetName)
1294+
return true
1295+
}
1296+
return false
1297+
}
1298+
1299+
// only gc statefulset pod lsp when:
1300+
// 1. the statefulset has been deleted or is being deleted
1301+
// 2. the statefulset has been deleted and recreated
1302+
// 3. the statefulset is down scaled and the pod is not alive
1303+
func isStatefulSetPodToGC(c kubernetes.Interface, pod *v1.Pod, statefulSetName string, statefulSetUID types.UID) bool {
1304+
sts, err := c.AppsV1().StatefulSets(pod.Namespace).Get(context.Background(), statefulSetName, metav1.GetOptions{})
1305+
if err != nil {
1306+
// the statefulset has been deleted
1307+
if k8serrors.IsNotFound(err) {
1308+
klog.Infof("statefulset %s/%s has been deleted", pod.Namespace, statefulSetName)
1309+
return true
1310+
}
1311+
klog.Errorf("failed to get statefulset %s/%s: %v", pod.Namespace, statefulSetName, err)
1312+
return false
1313+
}
1314+
1315+
// statefulset is being deleted
1316+
if !sts.DeletionTimestamp.IsZero() {
1317+
klog.Infof("statefulset %s/%s is being deleted", pod.Namespace, statefulSetName)
1318+
return true
1319+
}
1320+
// the statefulset has been deleted and recreated
1321+
if sts.UID != statefulSetUID {
1322+
klog.Infof("statefulset %s/%s is a newly created one", pod.Namespace, statefulSetName)
12901323
return true
12911324
}
1325+
1326+
// the statefulset is down scaled and the pod is not alive
1327+
1328+
tempStrs := strings.Split(pod.Name, "-")
1329+
numStr := tempStrs[len(tempStrs)-1]
1330+
index, err := strconv.ParseInt(numStr, 10, 0)
1331+
if err != nil {
1332+
klog.Errorf("failed to parse %s to int", numStr)
1333+
return false
1334+
}
1335+
// down scaled
1336+
var startOrdinal int64
1337+
if sts.Spec.Ordinals != nil {
1338+
startOrdinal = int64(sts.Spec.Ordinals.Start)
1339+
}
1340+
if index >= startOrdinal+int64(*sts.Spec.Replicas) {
1341+
klog.Infof("statefulset %s/%s is down scaled", pod.Namespace, statefulSetName)
1342+
if !isPodAlive(pod) {
1343+
// we must check whether the pod is alive because we have to consider the following case:
1344+
// 1. the statefulset is down scaled to zero
1345+
// 2. the lsp gc is triggered
1346+
// 3. gc interval, e.g. 90s, is passed and the second gc is triggered
1347+
// 4. the sts is up scaled to the original replicas
1348+
// 5. the pod is still running and it will not be recreated
1349+
return true
1350+
}
1351+
}
1352+
12921353
return false
12931354
}
12941355

0 commit comments

Comments
 (0)