// pkg/controller/controller.go

package controller

import (
	"context"
	"fmt"
	"strconv"
	"time"

	"github.com/lnsp/k8s-crash-informer/pkg/chat"
	"github.com/lnsp/k8s-crash-informer/pkg/client"
	"github.com/lnsp/k8s-crash-informer/pkg/utils"
	"k8s.io/klog"

	appsv1 "k8s.io/api/apps/v1"
	v1 "k8s.io/api/core/v1"
	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
	"k8s.io/apimachinery/pkg/fields"
	"k8s.io/apimachinery/pkg/util/runtime"
	"k8s.io/apimachinery/pkg/util/wait"
	"k8s.io/client-go/kubernetes"
	"k8s.io/client-go/tools/cache"
	"k8s.io/client-go/util/workqueue"
)

// Controller watches pods through an informer-backed cache and sends a chat
// notification when a container of an opted-in pod sits in CrashLoopBackOff.
type Controller struct {
	// queue holds the pod keys that still have to be processed by a worker.
	queue           workqueue.RateLimitingInterface
	// cacheIndexer is the local store that queued keys are resolved against.
	cacheIndexer    cache.Indexer
	// cacheController is the informer that is started by Run and whose sync
	// state is awaited before workers are launched.
	cacheController cache.Controller
	// chat is the client crash notifications are sent through.
	chat            chat.Client
	// clientset is used to fetch owning ReplicaSets/Deployments and pod logs.
	clientset       kubernetes.Interface

	// timeouts maps a pod name to the time the last notification for that pod
	// was recorded; it is used to throttle repeated notifications.
	// NOTE(review): the map is accessed without a lock. The package-level Run
	// starts a single worker, so this is fine today, but raising the worker
	// count would need synchronization here.
	timeouts map[string]time.Time
}

// processNextItem takes a single key off the work queue, runs the sync logic
// for it and hands the outcome to handleErr. It returns false once the queue
// reports shutdown, which tells the calling worker loop to stop, and true in
// every other case.
func (c *Controller) processNextItem() bool {
	// Get blocks until a key is available or the queue is shutting down.
	item, shutdown := c.queue.Get()
	if shutdown {
		return false
	}
	// Always mark the key as done when leaving, so the queue can hand it out
	// again. Until then the same key is not processed by another worker.
	defer c.queue.Done(item)

	// Keys are enqueued as strings; run the sync and let handleErr decide
	// whether the key is retried or forgotten.
	podKey := item.(string)
	c.handleErr(c.syncToStdout(podKey), item)
	return true
}

const (
	// annotationEnableMattermost is the annotation key that opts a pod, its
	// owning ReplicaSet or that ReplicaSet's Deployment in to crash notifications.
	annotationEnableMattermost       = "espe.tech/crash-informer"
	// annotationEnableMattermostInform is the value the opt-in annotation must
	// carry for notifications to be enabled.
	annotationEnableMattermostInform = "true"
)

// hasValidAnnotation reports whether crash notifications are enabled for pod.
// The opt-in annotation is looked up on the pod itself first, then on the
// ReplicaSet owning the pod and finally on the Deployment owning that
// ReplicaSet; the first object carrying the expected value enables it.
//
// While walking up the owner chain, a non-empty backoff annotation found on
// the ReplicaSet or Deployment is copied onto pod, so that code reading the
// backoff annotation from the pod afterwards sees the inherited value. A
// Deployment value replaces a ReplicaSet value. pod is modified in place;
// callers holding a shared object should pass a copy.
//
// A failed owner lookup is logged and treated as "not enabled".
func (c *Controller) hasValidAnnotation(pod *v1.Pod) bool {
	// Indexing a nil map is safe in Go, so no placeholder map is needed for reads.
	if pod.ObjectMeta.Annotations[annotationEnableMattermost] == annotationEnableMattermostInform {
		return true
	}

	// inheritBackoff copies the owner's backoff annotation onto the pod.
	// Empty owner values are skipped so they cannot erase a value that is
	// already present, and the annotation map is created on the pod itself
	// (not on a throwaway local) so the inherited value is not lost for pods
	// that carry no annotations at all.
	inheritBackoff := func(owner map[string]string) {
		value := owner[annotationMattermostBackoff]
		if value == "" {
			return
		}
		if pod.ObjectMeta.Annotations == nil {
			pod.ObjectMeta.Annotations = make(map[string]string)
		}
		pod.ObjectMeta.Annotations[annotationMattermostBackoff] = value
	}

	// Backtrack to the ReplicaSet using ownerReferences.
	rs, err := c.findPodReplicaSet(pod)
	if err != nil {
		klog.Infof("Failed to get replicaset: %v", err)
		return false
	}
	inheritBackoff(rs.ObjectMeta.Annotations)
	if rs.ObjectMeta.Annotations[annotationEnableMattermost] == annotationEnableMattermostInform {
		return true
	}

	// Continue one level up to the Deployment owning the ReplicaSet.
	dep, err := c.findPodDeployment(pod, rs)
	if err != nil {
		klog.Infof("Failed to get deployment: %v", err)
		return false
	}
	inheritBackoff(dep.ObjectMeta.Annotations)
	return dep.ObjectMeta.Annotations[annotationEnableMattermost] == annotationEnableMattermostInform
}

// findPodReplicaSet fetches the ReplicaSet referenced by the first owner
// reference of kind "ReplicaSet" on pod, looking it up in the pod's namespace.
// It returns an error when the lookup fails or when pod has no such owner.
func (c *Controller) findPodReplicaSet(pod *v1.Pod) (*appsv1.ReplicaSet, error) {
	for _, owner := range pod.GetOwnerReferences() {
		if owner.Kind != "ReplicaSet" {
			continue
		}
		replicaSets := c.clientset.AppsV1().ReplicaSets(pod.Namespace)
		replicaSet, getErr := replicaSets.Get(context.Background(), owner.Name, metav1.GetOptions{})
		if getErr != nil {
			return nil, fmt.Errorf("failed to retrieve owner ref: %w", getErr)
		}
		return replicaSet, nil
	}
	// No owner reference of the wanted kind was present.
	return nil, fmt.Errorf("replicaset not found")
}

// findPodDeployment fetches the Deployment referenced by the first owner
// reference of kind "Deployment" on rs. The lookup uses the namespace of pod.
// It returns an error when the lookup fails or when rs has no such owner.
func (c *Controller) findPodDeployment(pod *v1.Pod, rs *appsv1.ReplicaSet) (*appsv1.Deployment, error) {
	for _, owner := range rs.GetOwnerReferences() {
		if owner.Kind != "Deployment" {
			continue
		}
		deployments := c.clientset.AppsV1().Deployments(pod.Namespace)
		deployment, getErr := deployments.Get(context.Background(), owner.Name, metav1.GetOptions{})
		if getErr != nil {
			return nil, fmt.Errorf("failed to retrieve owner ref: %w", getErr)
		}
		return deployment, nil
	}
	// No owner reference of the wanted kind was present.
	return nil, fmt.Errorf("deployment not found")
}

const (
	// annotationMattermostBackoff is the annotation key holding the minimum
	// interval between two notifications for a pod, as an integer number of seconds.
	annotationMattermostBackoff        = "espe.tech/informer-backoff"
	// annotationMattermostBackoffDefault is the interval used when the backoff
	// annotation is absent or empty.
	annotationMattermostBackoffDefault = time.Minute * 10
)

// refreshBackoff decides whether a notification for pod may be sent now.
// It returns true, and records the current time for the pod, when at least
// the backoff interval has passed since the last recorded notification (or
// none was recorded yet); otherwise it returns false and changes nothing.
//
// The interval is read from the pod's backoff annotation as a whole number
// of seconds. When the annotation is missing, empty, not a number or
// negative, the default interval is used; an unusable value is logged. Falling
// back instead of refusing keeps a typo in the annotation from silently
// muting every crash notification for the pod.
//
// The bookkeeping is keyed by pod name, so all containers of a pod share one
// interval; container is currently not consulted.
func (c *Controller) refreshBackoff(pod *v1.Pod, container *v1.ContainerStatus) bool {
	backoff := annotationMattermostBackoffDefault
	if raw := pod.GetObjectMeta().GetAnnotations()[annotationMattermostBackoff]; raw != "" {
		seconds, err := strconv.Atoi(raw)
		if err != nil || seconds < 0 {
			// Keep the default: a negative interval would disable throttling
			// entirely and an unparsable one carries no usable information.
			klog.Warningf("Pod %s has invalid backoff interval: '%s'", pod.GetName(), raw)
		} else {
			backoff = time.Duration(seconds) * time.Second
		}
	}

	name := pod.GetName()
	// A pod without an entry yields the zero time, which is always far enough
	// in the past to let the first notification through.
	if time.Since(c.timeouts[name]) < backoff {
		return false
	}
	c.timeouts[name] = time.Now()
	return true
}

// clearTimeout removes the recorded notification time of pod, if any, so the
// next notification for a pod of that name is not throttled.
func (c *Controller) clearTimeout(pod *v1.Pod) {
	podName := pod.GetName()
	delete(c.timeouts, podName)
}

// sendCrashNotification sends a crash-loop notification for container of pod
// through the chat client. The notification carries the container's logs and,
// when a last termination state is recorded, its termination reason.
//
// Fetching the logs is best effort: a failure is logged and the notification
// is still sent with whatever bytes the log request returned.
func (c *Controller) sendCrashNotification(pod *v1.Pod, container *v1.ContainerStatus) {
	logs, err := c.clientset.
		CoreV1().Pods(pod.Namespace).
		GetLogs(pod.Name, &v1.PodLogOptions{Container: container.Name}).Do(context.Background()).Raw()
	if err != nil {
		// Do not drop the alert just because the logs are unavailable.
		klog.Warningf("Failed to fetch logs of container %s in pod %s: %v", container.Name, pod.Name, err)
	}
	message := fmt.Sprintf("Container %s of pod %s keeps crashing, maybe its time to intervene.", container.Name, pod.Name)
	note := &chat.CrashNotification{
		Title:   "Crash loop detected!",
		Message: message,
		Logs:    string(logs),
	}
	// The termination state is optional; only report a reason when it exists.
	if container.LastTerminationState.Terminated != nil {
		note.Reason = container.LastTerminationState.Terminated.Reason
	}
	c.chat.Send(note)
}

// handlePodUpdate inspects the container statuses of pod and sends a crash
// notification for every container that is not ready and waiting with reason
// "CrashLoopBackOff", provided notifications are enabled for the pod and the
// backoff interval allows another one.
//
// pod itself is never modified: the annotation check may write inherited
// annotations onto the pod it is given, and pod typically comes straight from
// the informer store, whose objects must be treated as read-only. The check
// therefore runs on a private copy, which is only created once a crash-looping
// container has actually been found. The check is also evaluated at most once
// per call, since its outcome depends on the pod and not on the container,
// which avoids repeating the owner lookups for every container.
func (c *Controller) handlePodUpdate(pod *v1.Pod) {
	// working is the private copy handed to the helpers; nil until needed.
	var working *v1.Pod
	for i := range pod.Status.ContainerStatuses {
		status := &pod.Status.ContainerStatuses[i]
		if status.Ready || status.State.Waiting == nil {
			continue
		}
		if status.State.Waiting.Reason != "CrashLoopBackOff" {
			continue
		}
		if working == nil {
			working = pod.DeepCopy()
			if !c.hasValidAnnotation(working) {
				// Notifications are not enabled for this pod at all.
				return
			}
		}
		if !c.refreshBackoff(working, status) {
			continue
		}
		c.sendCrashNotification(working, status)
	}
}

// syncToStdout is the business logic of the controller. It resolves key
// against the local store and, when the pod exists, passes it on to
// handlePodUpdate. When the pod is gone, the notification bookkeeping kept
// for it is removed. An error is returned when the store lookup fails or the
// stored object is not a pod; retrying is left to the caller.
func (c *Controller) syncToStdout(key string) error {
	obj, exists, err := c.cacheIndexer.GetByKey(key)
	if err != nil {
		klog.Errorf("Fetching object with key %s from store failed with %v", key, err)
		return err
	}
	if !exists {
		klog.Infof("Pod %s does not exist anymore\n", key)
		// No object is available for a key that is no longer in the store, so
		// the pod name is recovered from the key instead. The bookkeeping map
		// is keyed by pod name; without this, entries of deleted pods would
		// never be removed.
		_, name, splitErr := cache.SplitMetaNamespaceKey(key)
		if splitErr != nil {
			// Retrying cannot repair a malformed key; report it and move on.
			klog.Warningf("Cannot clean up state for key %s: %v", key, splitErr)
			return nil
		}
		delete(c.timeouts, name)
		return nil
	}

	klog.Infof("Received create/update/delete for Pod %s\n", key)
	// Note that you also have to check the uid if you have a local controlled resource, which
	// is dependent on the actual instance, to detect that a Pod was recreated with the same name
	pod, ok := obj.(*v1.Pod)
	if !ok {
		// Guard the assertion so an unexpected object cannot panic the worker.
		return fmt.Errorf("unexpected object of type %T for key %s", obj, key)
	}
	c.handlePodUpdate(pod)
	return nil
}

// handleErr settles the outcome of one sync attempt for key. A nil err clears
// the key's retry history. A non-nil err re-enqueues the key with rate
// limiting until the retry budget is used up; after that the key is dropped
// and the error is reported.
func (c *Controller) handleErr(err error, key interface{}) {
	// maxRetries is the number of requeues allowed before a key is given up on.
	const maxRetries = 5

	switch {
	case err == nil:
		// Success: forget the rate-limiting history so that later updates for
		// this key are not delayed by stale failures.
		c.queue.Forget(key)

	case c.queue.NumRequeues(key) < maxRetries:
		klog.Infof("Error syncing pod %v: %v", key, err)
		// The rate limiter and the requeue history decide when the key is
		// handed out again.
		c.queue.AddRateLimited(key)

	default:
		// Retry budget exhausted: stop tracking the key and surface the error.
		c.queue.Forget(key)
		runtime.HandleError(err)
		klog.Infof("Dropping pod %q out of the queue: %v", key, err)
	}
}

// Run starts the informer, waits for its cache to sync, launches threadiness
// worker goroutines and then blocks until stopCh is closed. The work queue is
// shut down when Run returns, which lets the workers terminate. If the cache
// does not sync, the failure is reported and Run returns without starting
// any worker.
func (c *Controller) Run(threadiness int, stopCh chan struct{}) {
	defer runtime.HandleCrash()
	// Shutting the queue down on exit is what makes the workers stop.
	defer c.queue.ShutDown()

	klog.Info("Starting Pod controller")
	go c.cacheController.Run(stopCh)

	// Items must not be processed before the local cache is populated.
	synced := cache.WaitForCacheSync(stopCh, c.cacheController.HasSynced)
	if !synced {
		runtime.HandleError(fmt.Errorf("Timed out waiting for caches to sync"))
		return
	}

	// Each worker is re-run one second after it returns, until stopCh closes.
	for remaining := threadiness; remaining > 0; remaining-- {
		go wait.Until(c.runWorker, time.Second, stopCh)
	}

	<-stopCh
	klog.Info("Stopping Pod controller")
}

// runWorker processes queue items one after another and returns as soon as
// processNextItem reports that processing should stop.
func (c *Controller) runWorker() {
	for {
		if !c.processNextItem() {
			return
		}
	}
}

// Run wires up and starts the crash informer: it initializes logging flags,
// builds the chat client and the in-cluster Kubernetes client, determines the
// namespace to watch, connects a pod informer to a rate-limited work queue
// and starts the controller with a single worker. Any setup failure is fatal.
// Run never returns.
func Run() {
	klog.InitFlags(nil)

	notifier, err := chat.NewClientFromEnv()
	if err != nil {
		klog.Fatal(err)
	}
	klog.Info("Chat client configuration successful")

	kube, err := client.InCluster()
	if err != nil {
		klog.Fatal(err)
	}

	ns, err := utils.Namespace()
	if err != nil {
		klog.Fatal(err)
	}
	klog.Infof("Watching namespace %s", ns)

	// Watch every pod in the namespace.
	podWatcher := cache.NewListWatchFromClient(kube.CoreV1().RESTClient(), "pods", ns, fields.Everything())

	// Keys of changed pods are collected here for the workers.
	workQueue := workqueue.NewRateLimitingQueue(workqueue.DefaultControllerRateLimiter())

	// enqueue derives the key of obj with keyOf and adds it to the work queue;
	// objects no key can be derived for are skipped.
	enqueue := func(keyOf cache.KeyFunc, obj interface{}) {
		if key, keyErr := keyOf(obj); keyErr == nil {
			workQueue.Add(key)
		}
	}

	// Every cache change puts the affected pod's key on the queue. By the time
	// a key is processed, the cache may already hold a newer version of the
	// pod than the one that triggered the event.
	handlers := cache.ResourceEventHandlerFuncs{
		AddFunc: func(obj interface{}) {
			enqueue(cache.MetaNamespaceKeyFunc, obj)
		},
		UpdateFunc: func(_ interface{}, updated interface{}) {
			enqueue(cache.MetaNamespaceKeyFunc, updated)
		},
		DeleteFunc: func(obj interface{}) {
			// IndexerInformer uses a delta queue, therefore deletes need the
			// deletion-handling key function.
			enqueue(cache.DeletionHandlingMetaNamespaceKeyFunc, obj)
		},
	}
	podIndexer, podInformer := cache.NewIndexerInformer(podWatcher, &v1.Pod{}, 0, handlers, cache.Indexers{})

	ctrl := &Controller{
		queue:           workQueue,
		cacheIndexer:    podIndexer,
		cacheController: podInformer,
		chat:            notifier,
		clientset:       kube,
		timeouts:        make(map[string]time.Time),
	}

	stop := make(chan struct{})
	// NOTE(review): this deferred close never runs, because the select below
	// blocks forever; the controller is only stopped by process termination.
	defer close(stop)
	go ctrl.Run(1, stop)

	// Wait forever
	select {}
}