This repository has been archived by the owner on Jul 1, 2023. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 32
/
nodesstatus.go
96 lines (84 loc) · 2.69 KB
/
nodesstatus.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
/*
Copyright 2017 Gravitational, Inc.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package monitoring
import (
"context"
"fmt"
"github.com/gravitational/satellite/agent/health"
pb "github.com/gravitational/satellite/agent/proto/agentpb"
"github.com/gravitational/trace"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
"k8s.io/apimachinery/pkg/fields"
"k8s.io/apimachinery/pkg/labels"
"k8s.io/client-go/pkg/api/v1"
)
// NewNodesStatusChecker returns a Checker that tests kubernetes nodes availability
func NewNodesStatusChecker(hostPort string, nodesReadyThreshold int) health.Checker {
return &nodesStatusChecker{
hostPort: hostPort,
nodesReadyThreshold: nodesReadyThreshold,
}
}
// nodesStatusChecker tests and reports health failures in kubernetes
// nodes availability
type nodesStatusChecker struct {
name string
hostPort string
nodesReadyThreshold int
}
// Name returns the name of this checker
func (r *nodesStatusChecker) Name() string { return "nodesstatuses" }
// Check validates the status of kubernetes components
func (r *nodesStatusChecker) Check(ctx context.Context, reporter health.Reporter) {
client, err := ConnectToKube(r.hostPort, "")
if err != nil {
reason := "failed to connect to kubernetes apiserver"
reporter.Add(NewProbeFromErr(r.Name(), reason, trace.Wrap(err)))
return
}
listOptions := metav1.ListOptions{
LabelSelector: labels.Everything().String(),
FieldSelector: fields.Everything().String(),
}
statuses, err := client.Nodes().List(listOptions)
if err != nil {
reason := "failed to query nodes"
reporter.Add(NewProbeFromErr(r.Name(), reason, trace.Wrap(err)))
return
}
var nodesReady int
for _, item := range statuses.Items {
for _, condition := range item.Status.Conditions {
if condition.Type != v1.NodeReady {
continue
}
if condition.Status == v1.ConditionTrue {
nodesReady++
continue
}
}
}
if nodesReady < r.nodesReadyThreshold {
reporter.Add(&pb.Probe{
Checker: r.Name(),
Status: pb.Probe_Failed,
Error: fmt.Sprintf("Not enough ready nodes: %v (threshold %v)",
nodesReady, r.nodesReadyThreshold),
})
} else {
reporter.Add(&pb.Probe{
Checker: r.Name(),
Status: pb.Probe_Running,
})
}
}