-
Notifications
You must be signed in to change notification settings - Fork 134
/
pod_utilisation_kubelet_metrics.go
69 lines (60 loc) · 2.25 KB
/
pod_utilisation_kubelet_metrics.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
package utilisation
import (
"context"
"sync"
"time"
"k8s.io/apimachinery/pkg/api/resource"
"k8s.io/kubelet/pkg/apis/stats/v1alpha1"
log "github.com/sirupsen/logrus"
v1 "k8s.io/api/core/v1"
clusterContext "github.com/armadaproject/armada/internal/executor/context"
"github.com/armadaproject/armada/internal/executor/domain"
)
type podUtilisationKubeletMetrics struct{}
func newPodUtilisationKubeletMetrics() *podUtilisationKubeletMetrics {
return &podUtilisationKubeletMetrics{}
}
func (m *podUtilisationKubeletMetrics) fetch(nodes []*v1.Node, podNameToUtilisationData map[string]*domain.UtilisationData, clusterContext clusterContext.ClusterContext) {
summaries := make(chan *v1alpha1.Summary, len(nodes))
wg := sync.WaitGroup{}
for _, n := range nodes {
wg.Add(1)
go func(node *v1.Node) {
defer wg.Done()
ctx, cancelFunc := context.WithTimeout(context.Background(), time.Second*15)
defer cancelFunc()
summary, err := clusterContext.GetNodeStatsSummary(ctx, node)
if err != nil {
log.Warnf("Error when getting stats for node %s: %s", node.Name, err)
return
}
summaries <- summary
}(n)
}
go func() {
wg.Wait()
close(summaries)
}()
for s := range summaries {
for _, podStats := range s.Pods {
utilisationData, exists := podNameToUtilisationData[podStats.PodRef.Name]
if exists {
updatePodStats(&podStats, utilisationData)
}
}
}
}
func updatePodStats(podStats *v1alpha1.PodStats, utilisationData *domain.UtilisationData) {
if podStats.CPU != nil && podStats.CPU.UsageNanoCores != nil {
utilisationData.CurrentUsage["cpu"] = *resource.NewScaledQuantity(int64(*podStats.CPU.UsageNanoCores), -9)
}
if podStats.CPU != nil && podStats.CPU.UsageCoreNanoSeconds != nil {
utilisationData.CumulativeUsage["cpu"] = *resource.NewScaledQuantity(int64(*podStats.CPU.UsageCoreNanoSeconds), -9)
}
if podStats.Memory != nil && podStats.Memory.WorkingSetBytes != nil {
utilisationData.CurrentUsage["memory"] = *resource.NewQuantity(int64(*podStats.Memory.WorkingSetBytes), resource.BinarySI)
}
if podStats.EphemeralStorage != nil && podStats.EphemeralStorage.UsedBytes != nil {
utilisationData.CurrentUsage["ephemeral-storage"] = *resource.NewQuantity(int64(*podStats.EphemeralStorage.UsedBytes), resource.BinarySI)
}
}