From c8f6276beb658aaacf77060a15a05b1e06537401 Mon Sep 17 00:00:00 2001 From: qi liang Date: Mon, 4 Nov 2024 15:31:22 +0800 Subject: [PATCH 1/2] Add unknownMember status for etcd controller Signed-off-by: qi liang --- pkg/etcd/etcd.go | 19 +++++++++++++------ 1 file changed, 13 insertions(+), 6 deletions(-) diff --git a/pkg/etcd/etcd.go b/pkg/etcd/etcd.go index dfcce5433658..99d5496258e4 100644 --- a/pkg/etcd/etcd.go +++ b/pkg/etcd/etcd.go @@ -82,10 +82,11 @@ const ( etcdStatusType = v1.NodeConditionType("EtcdIsVoter") - StatusUnjoined MemberStatus = "unjoined" - StatusUnhealthy MemberStatus = "unhealthy" - StatusLearner MemberStatus = "learner" - StatusVoter MemberStatus = "voter" + StatusUnjoined MemberStatus = "unjoined" + StatusUnhealthy MemberStatus = "unhealthy" + StatusLearner MemberStatus = "learner" + StatusVoter MemberStatus = "voter" + StatusUnknownMember MemberStatus = "unknownMember" ) var ( @@ -1189,6 +1190,7 @@ func (e *ETCD) manageLearners(ctx context.Context) { // a map to track if a node is a member of the etcd cluster or not nodeIsMember := make(map[string]bool) nodesMap := make(map[string]*v1.Node) + membersWithoutNode := "" for _, node := range nodes { nodeIsMember[node.Name] = false nodesMap[node.Name] = node @@ -1214,7 +1216,7 @@ func (e *ETCD) manageLearners(ctx context.Context) { } } if node == nil { - continue + membersWithoutNode += (" " + member.Name) } // verify if the member is healthy and set the status @@ -1229,7 +1231,12 @@ func (e *ETCD) manageLearners(ctx context.Context) { } for nodeName, node := range nodesMap { - if !nodeIsMember[nodeName] { + if len(membersWithoutNode) > 0 { + statusMsg := fmt.Sprintf("unknown etcd members:%s", membersWithoutNode) + if err := e.setEtcdStatusCondition(node, client, nodeName, StatusUnknownMember, statusMsg); err != nil { + logrus.Errorf("Unable to set etcd status condition for node %s: %v", node.Name, err) + } + } else if !nodeIsMember[nodeName] { if err := e.setEtcdStatusCondition(node, client, 
nodeName, StatusUnjoined, ""); err != nil { logrus.Errorf("Unable to set etcd status condition for a node that is not a cluster member %s: %v", nodeName, err) } From aaa025ec5b22b9f60d02feb16925b81dee12d5de Mon Sep 17 00:00:00 2001 From: qi liang Date: Mon, 4 Nov 2024 15:40:12 +0800 Subject: [PATCH 2/2] Handle StatusUnknownMember in setEtcdStatusCondition Signed-off-by: qi liang --- pkg/etcd/etcd.go | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/pkg/etcd/etcd.go b/pkg/etcd/etcd.go index 99d5496258e4..52b28a417055 100644 --- a/pkg/etcd/etcd.go +++ b/pkg/etcd/etcd.go @@ -1352,6 +1352,13 @@ func (e *ETCD) setEtcdStatusCondition(node *v1.Node, client kubernetes.Interface Reason: "NotAMember", Message: "Node is not a member of the etcd cluster", } + case StatusUnknownMember: + newCondition = v1.NodeCondition{ + Type: etcdStatusType, + Status: "False", + Reason: "UnknownMember", + Message: "unknown member detected in etcd cluster", + } default: logrus.Warnf("Unknown etcd member status %s", memberStatus) return nil