/
tpcds_controller.go
144 lines (120 loc) · 5.19 KB
/
tpcds_controller.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
/*
Copyright 2023.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package controller
import (
"context"
"fmt"
"k8s.io/client-go/rest"
"k8s.io/apimachinery/pkg/runtime"
ctrl "sigs.k8s.io/controller-runtime"
"sigs.k8s.io/controller-runtime/pkg/client"
"sigs.k8s.io/controller-runtime/pkg/controller/controllerutil"
"sigs.k8s.io/controller-runtime/pkg/log"
benchmarkv1alpha1 "github.com/apecloud/kubebench/api/v1alpha1"
intctrlutil "github.com/apecloud/kubebench/internal/controllerutil"
"github.com/apecloud/kubebench/internal/utils"
)
// TpcdsReconciler reconciles a Tpcds object.
//
// It carries everything Reconcile needs to talk to the cluster: an API client,
// the scheme used when setting owner references, and a REST config that is
// handed to the job-log helper.
type TpcdsReconciler struct {
// Client is embedded so the reconciler can call Get, Create and Status()
// directly on itself.
client.Client
// Scheme is passed to controllerutil.SetOwnerReference when a job is made
// to be owned by its Tpcds.
Scheme *runtime.Scheme
// RestConfig is passed to utils.LogJobPodToCond when recording job results.
RestConfig *rest.Config
}
//+kubebuilder:rbac:groups=benchmark.apecloud.io,resources=tpcds,verbs=get;list;watch;create;update;patch;delete
//+kubebuilder:rbac:groups=benchmark.apecloud.io,resources=tpcds/status,verbs=get;update;patch
//+kubebuilder:rbac:groups=benchmark.apecloud.io,resources=tpcds/finalizers,verbs=update
// Reconcile drives a Tpcds benchmark through its jobs, one job at a time.
//
// Each pass fetches the Tpcds object and, unless its phase is already
// Completed or Failed, works on the job at index Status.Succeeded of the list
// returned by NewTpcdsJobs:
//   - if the job does not exist yet, it is created with the Tpcds set as owner
//     and the request is requeued;
//   - if the job reports a succeeded pod, Status.Succeeded is incremented and
//     utils.LogJobPodToCond is called with Status.Conditions;
//   - if the job reports a failed pod, the phase becomes Failed and
//     utils.LogJobPodToCond is called with Status.Conditions;
//   - otherwise the job is still running and the status is left as is.
//
// On the first pass (empty phase) the phase is set to Running and Status.Total
// is set to the number of jobs. Once Status.Succeeded reaches Status.Total the
// phase becomes Completed.
//
// Every pass that reaches the end patches the status, including the
// "succeeded/total" Completions string, and requeues after
// intctrlutil.RequeueDuration. A Tpcds that no longer exists is not an error.
//
// For more details, check Reconcile and its Result here:
// - https://pkg.go.dev/sigs.k8s.io/controller-runtime@v0.15.0/pkg/reconcile
func (r *TpcdsReconciler) Reconcile(ctx context.Context, req ctrl.Request) (ctrl.Result, error) {
	l := log.FromContext(ctx)

	var tpcds benchmarkv1alpha1.Tpcds
	if err := r.Get(ctx, req.NamespacedName, &tpcds); err != nil {
		// A missing object means it was deleted after the request was
		// queued; that is routine, so do not report it as an error.
		if client.IgnoreNotFound(err) == nil {
			return ctrl.Result{}, nil
		}
		l.Error(err, "unable to fetch Tpcds")
		return ctrl.Result{}, err
	}

	// Snapshot taken before any mutation; it is the base of the status patch.
	old := tpcds.DeepCopy()

	// if tpcds completed or failed, do nothing
	if tpcds.Status.Phase == benchmarkv1alpha1.Completed || tpcds.Status.Phase == benchmarkv1alpha1.Failed {
		return intctrlutil.Reconciled()
	}

	jobs := NewTpcdsJobs(tpcds)

	if tpcds.Status.Phase == "" {
		l.Info("start tpcds", "tpcds", tpcds.Name)
		tpcds.Status.Phase = benchmarkv1alpha1.Running
		tpcds.Status.Total = len(jobs)
	}

	switch {
	case tpcds.Status.Succeeded >= tpcds.Status.Total:
		tpcds.Status.Phase = benchmarkv1alpha1.Completed

	case tpcds.Status.Succeeded >= len(jobs):
		// Status.Total was recorded on an earlier pass, while jobs is rebuilt
		// on every pass. If the rebuilt list is shorter than the recorded
		// total, indexing it below would panic, so fail the run instead.
		err := fmt.Errorf("status records %d of %d jobs succeeded but only %d jobs are defined",
			tpcds.Status.Succeeded, tpcds.Status.Total, len(jobs))
		l.Error(err, "tpcds job list no longer matches recorded status")
		tpcds.Status.Phase = benchmarkv1alpha1.Failed

	default:
		job := jobs[tpcds.Status.Succeeded]

		existed, err := utils.IsJobExisted(r.Client, ctx, job.Name, tpcds.Namespace)
		if err != nil {
			l.Error(err, "failed to check if job exists", "job", job.Name)
			return intctrlutil.RequeueWithError(err, l, "failed to check if job exists")
		}

		if !existed {
			if err = controllerutil.SetOwnerReference(&tpcds, job, r.Scheme); err != nil {
				l.Error(err, "failed to set owner reference for job", "job", job.Name)
				return intctrlutil.RequeueWithError(err, l, "failed to set owner reference for job")
			}
			if err = r.Create(ctx, job); err != nil {
				l.Error(err, "failed to create job", "job", job.Name)
				return intctrlutil.RequeueWithError(err, l, "failed to create job")
			}

			// wait for the job to be created
			l.Info("created job", "job", job.Name)
			return intctrlutil.RequeueAfter(intctrlutil.RequeueDuration)
		}

		// check if the job is completed; look it up in the same namespace the
		// existence check above used
		status, err := utils.GetJobStatus(r.Client, ctx, job.Name, tpcds.Namespace)
		if err != nil {
			l.Error(err, "failed to get job status", "job", job.Name)
			return intctrlutil.RequeueWithError(err, l, "failed to get job status")
		}

		switch {
		case status.Succeeded > 0:
			l.Info("job completed", "job", job.Name)
			tpcds.Status.Succeeded++

			// record the result; on error nothing has been patched yet, so
			// the next pass starts again from the stored status
			if err := utils.LogJobPodToCond(r.Client, r.RestConfig, ctx, job.Name, tpcds.Namespace, &tpcds.Status.Conditions, nil); err != nil {
				return intctrlutil.RequeueWithError(err, l, "unable to record the log")
			}

		case status.Failed > 0:
			l.Info("job failed", "job", job.Name)
			tpcds.Status.Phase = benchmarkv1alpha1.Failed
			if err := utils.LogJobPodToCond(r.Client, r.RestConfig, ctx, job.Name, tpcds.Namespace, &tpcds.Status.Conditions, nil); err != nil {
				return intctrlutil.RequeueWithError(err, l, "unable to record the log")
			}

		default:
			l.Info("job is running", "job", job.Name)
		}
	}

	tpcds.Status.Completions = fmt.Sprintf("%d/%d", tpcds.Status.Succeeded, tpcds.Status.Total)

	if err := r.Status().Patch(ctx, &tpcds, client.MergeFrom(old)); err != nil {
		l.Error(err, "failed to patch tpcds status")
		return intctrlutil.RequeueWithError(err, l, "failed to patch tpcds status")
	}

	// Jobs are not watched by this controller, so poll again later.
	return intctrlutil.RequeueAfter(intctrlutil.RequeueDuration)
}
// SetupWithManager registers this reconciler with mgr as the controller for
// Tpcds objects and returns any error from building that controller.
func (r *TpcdsReconciler) SetupWithManager(mgr ctrl.Manager) error {
	// Start a controller builder bound to the manager.
	b := ctrl.NewControllerManagedBy(mgr)

	// Tpcds is the primary resource whose events trigger Reconcile.
	b = b.For(&benchmarkv1alpha1.Tpcds{})

	return b.Complete(r)
}