/
schedule_watcher.go
216 lines (197 loc) · 7.04 KB
/
schedule_watcher.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
package cdule
import (
"encoding/json"
"reflect"
"sort"
"sync"
"time"
"github.com/deepaksinghvi/cdule/pkg"
"github.com/deepaksinghvi/cdule/pkg/model"
"github.com/robfig/cron/v3"
log "github.com/sirupsen/logrus"
"gorm.io/gorm"
)
// ScheduleWatcher drives the periodic scheduling loop: Run evaluates due
// schedules on every Ticker tick, Closed signals the loop to exit, and WG
// lets Stop block until outstanding work has drained.
type ScheduleWatcher struct {
	// Closed is closed by Stop to terminate the Run loop.
	Closed chan struct{}
	// WG is waited on by Stop; NOTE(review): Run itself never calls
	// WG.Add/Done, so the Add is presumably done by the caller — confirm.
	WG sync.WaitGroup
	// Ticker paces how often due schedules are evaluated.
	Ticker *time.Ticker
}
// lastScheduleExecutionTime and nextScheduleExecutionTime bound the current
// evaluation window in UnixNano; both are rewritten by Run on every tick.
var lastScheduleExecutionTime int64
var nextScheduleExecutionTime int64
// Run loops until Closed is closed. On every tick it computes a one-minute
// lookback window ending at the current instant and executes all schedules
// that fall inside it.
func (t *ScheduleWatcher) Run() {
	for {
		select {
		case <-t.Ticker.C:
			current := time.Now()
			lastScheduleExecutionTime = current.Add(-1 * time.Minute).UnixNano()
			nextScheduleExecutionTime = current.UnixNano()
			log.Infof("lastScheduleExecutionTime %d, nextScheduleExecutionTime %d", lastScheduleExecutionTime, nextScheduleExecutionTime)
			runNextScheduleJobs(lastScheduleExecutionTime, nextScheduleExecutionTime)
		case <-t.Closed:
			return
		}
	}
}
// Stop terminates the watcher: closing Closed makes Run return, then the
// WaitGroup is drained so any in-flight work finishes before Stop returns.
// Calling Stop more than once panics (double close of Closed).
func (t *ScheduleWatcher) Stop() {
	close(t.Closed)
	t.WG.Wait()
}
// runNextScheduleJobs executes every schedule for this worker whose
// execution time falls inside the [scheduleStart, scheduleEnd] window
// (UnixNano timestamps), records a JobHistory row per run, and creates the
// next occurrence of each job from its cron expression. Any panic raised
// while processing the window is absorbed by panicRecoveryForSchedule.
func runNextScheduleJobs(scheduleStart, scheduleEnd int64) {
	defer panicRecoveryForSchedule()
	schedules, err := model.CduleRepos.CduleRepository.GetScheduleBetween(scheduleStart, scheduleEnd, WorkerID)
	if nil != err {
		log.Error(err)
		return
	}
	workers, err := model.CduleRepos.CduleRepository.GetWorkers()
	if nil != err {
		log.Error(err)
		return
	}
	// The parser configuration is identical for every job, so build it once
	// instead of once per schedule iteration.
	cronParser := cron.NewParser(cron.Second | cron.Minute | cron.Hour | cron.Dom | cron.Month | cron.Dow)
	for _, schedule := range schedules {
		scheduledJob, err := model.CduleRepos.CduleRepository.GetJob(schedule.JobID)
		if nil != err {
			log.Errorf("Error while running Schedule for %d : %s", schedule.JobID, err.Error())
			continue
		}
		log.Info("====START====")
		// FIX: log message typo "Exeuction" corrected.
		log.Infof("Schedule for JobName: %s, Execution Time %d at Worker %s", scheduledJob.JobName, schedule.ExecutionID, schedule.WorkerID)
		jobDataStr := schedule.JobData
		var jobDataMap map[string]string
		if pkg.EMPTYSTRING != jobDataStr {
			err = json.Unmarshal([]byte(jobDataStr), &jobDataMap)
			if nil != err {
				log.Error(err)
				continue
			}
		}
		var jobHistory *model.JobHistory
		// err is always nil here (both failure paths above continue); the
		// guard is kept to preserve the original control flow.
		if err == nil {
			jobHistory, err = model.CduleRepos.CduleRepository.GetJobHistoryForSchedule(schedule.ExecutionID)
			j := JobRegistry[scheduledJob.JobName]
			jobInstance := reflect.New(j).Elem().Interface()
			if err != nil && err.Error() == "record not found" && jobHistory != nil {
				// History row exists but the job never ran: resume it.
				// NOTE(review): with a "record not found" error jobHistory is
				// normally nil, which would make this branch unreachable —
				// confirm against the repository implementation.
				if jobHistory.Status == model.JobStatusNew {
					jobHistory.Status = model.JobStatusInProgress
					model.CduleRepos.CduleRepository.UpdateJobHistory(jobHistory)
					jobInstance.(Job).Execute(jobDataMap)
					jobDataMap = jobInstance.(Job).GetJobData()
				}
			} else {
				// No history for this schedule yet: create one, mark it
				// in-progress, and execute the job.
				jobHistory = &model.JobHistory{
					JobID:       schedule.JobID,
					ExecutionID: schedule.ExecutionID,
					DeletedAt:   gorm.DeletedAt{},
					Status:      model.JobStatusNew,
					WorkerID:    schedule.WorkerID,
					RetryCount:  0,
				}
				model.CduleRepos.CduleRepository.CreateJobHistory(jobHistory)
				jobHistory.Status = model.JobStatusInProgress
				model.CduleRepos.CduleRepository.UpdateJobHistory(jobHistory)
				jobDataMap = executeJob(jobInstance, jobHistory, &jobDataMap)
				log.Infof("Job Execution Completed For JobName: %s JobID: %d on Worker: %s", scheduledJob.JobName, schedule.JobID, schedule.WorkerID)
				log.Info("====END====\n")
			}
			// Calculate and persist the next schedule for the current job.
			jobDataBytes, err := json.Marshal(jobDataMap)
			if nil != err {
				log.Errorf("Error %s for JobName %s and Schedule ID %d ", err.Error(), scheduledJob.JobName, schedule.ExecutionID)
			}
			if string(jobDataBytes) != pkg.EMPTYSTRING {
				jobDataStr = string(jobDataBytes)
			}
			cronSchedule, err := cronParser.Parse(scheduledJob.CronExpression)
			if err != nil {
				// FIX: was `return`, which aborted scheduling of all
				// remaining due jobs when a single cron expression failed
				// to parse; skip just this job instead.
				log.Error(err.Error())
				continue
			}
			nextRunTime := cronSchedule.Next(time.Now()).UnixNano()
			workerIDForNextRun, _ := findNextAvailableWorker(workers, schedule)
			newSchedule := model.Schedule{
				ExecutionID: nextRunTime,
				CreatedAt:   time.Now(),
				UpdatedAt:   time.Now(),
				DeletedAt:   gorm.DeletedAt{},
				WorkerID:    workerIDForNextRun,
				JobID:       schedule.JobID,
				JobData:     jobDataStr,
			}
			model.CduleRepos.CduleRepository.CreateSchedule(&newSchedule)
			log.Infof("*** Next Job Scheduled Info ***\n JobName: %s,\n Schedule Cron: %s,\n Job Scheduled Time: %d,\n Worker: %s ",
				scheduledJob.JobName, scheduledJob.CronExpression, newSchedule.ExecutionID, newSchedule.WorkerID)
		}
	}
	log.Infof("Schedules Completed For StartTime %d To EndTime %d", scheduleStart, scheduleEnd)
}
// WorkerJobCount pairs a worker with the number of job_histories rows it
// holds for a given job; used by findNextAvailableWorker to pick the
// least-loaded worker for the next run.
type WorkerJobCount struct {
	WorkerID string `json:"worker_id"`
	Count    int64  `json:"count"`
}
// findNextAvailableWorker selects the worker that has executed the
// schedule's job the fewest times, so repeated runs spread across workers.
// Workers with no history for the job are treated as count 0. When no
// metrics are available (or the query fails) it falls back to the
// schedule's current worker. The error return is always nil; the signature
// is kept for callers.
func findNextAvailableWorker(workers []model.Worker, schedule model.Schedule) (string, error) {
	workerName := schedule.WorkerID
	var workerJobCountMetrics []WorkerJobCount
	result := model.DB.Raw("SELECT worker_id, count(1) FROM job_histories WHERE job_id = ? group by worker_id", schedule.JobID).Scan(&workerJobCountMetrics)
	if result.Error != nil {
		// FIX: the query error was silently discarded; log it and fall back
		// to the schedule's current worker (same outcome as the original's
		// empty-metrics path).
		log.Error(result.Error)
		return workerName, nil
	}
	log.Infof("workerJobCountMetrics %v", workerJobCountMetrics)
	if len(workerJobCountMetrics) == 0 {
		log.Infof("workerName %s would be used", workerName)
		return workerName, nil
	}
	// Give every worker with no history a zero-count entry so it can win
	// the sort below.
	for _, worker := range workers {
		seen := false
		for _, v := range workerJobCountMetrics {
			if v.WorkerID == worker.WorkerID {
				seen = true
				break
			}
		}
		if !seen {
			workerJobCountMetrics = append(workerJobCountMetrics, WorkerJobCount{
				WorkerID: worker.WorkerID,
				Count:    0,
			})
		}
	}
	// FIX: dropped the redundant full-slice expression ([:]) — sort.Slice
	// takes the slice value directly.
	sort.Slice(workerJobCountMetrics, func(i, j int) bool {
		return workerJobCountMetrics[i].Count < workerJobCountMetrics[j].Count
	})
	return workerJobCountMetrics[0].WorkerID, nil
}
/*
For go 1.17 following method can be used.
func executeJob(jobInstance interface{}, jobHistory *model.JobHistory, jobDataMap map[string]string) {
defer panicRecovery(jobHistory)
jobInstance.(job.Job).Execute(jobDataMap)
}
*/
/*
cdule library has been built and developed using go 1.18 (go1.18beta2), if you need to use it for 1.17
then build from source by uncommenting the above method and comment the following
*/
// executeJob runs the given job instance with the supplied job data and
// returns the data the instance reports afterwards. The deferred
// panicRecovery finalizes jobHistory (COMPLETED or FAILED) even if the
// job panics. jobInstance must implement Job; a failed assertion panics
// and is likewise absorbed by panicRecovery.
func executeJob(jobInstance any, jobHistory *model.JobHistory, jobDataMap *map[string]string) map[string]string {
	defer panicRecovery(jobHistory)
	runnable := jobInstance.(Job)
	runnable.Execute(*jobDataMap)
	return runnable.GetJobData()
}
// panicRecovery finalizes a job's history row after execution: COMPLETED on
// a normal return, FAILED when the job panicked. It must be deferred by the
// function that runs the job for recover() to take effect.
// TODO should be handled for any panic and set the status as FAILED for job history with error message
func panicRecovery(jobHistory *model.JobHistory) {
	status := model.JobStatusCompleted
	if r := recover(); r != nil {
		log.Warning("Recovered in panicRecovery for job execution ", r)
		status = model.JobStatusFailed
	}
	jobHistory.Status = status
	model.CduleRepos.CduleRepository.UpdateJobHistory(jobHistory)
}
// panicRecoveryForSchedule absorbs any panic raised while processing a
// schedule window so the watcher loop keeps ticking. It must be deferred
// by runNextScheduleJobs for recover() to take effect.
func panicRecoveryForSchedule() {
	r := recover()
	if r != nil {
		log.Warning("Recovered in runNextScheduleJobs ", r)
	}
}