src/ablauf/job.clj

(ns ablauf.job
  "
  An abstract program runtime for ASTs produced by `ablauf.job.ast`.
  This exposes two functions for the outside world: `make`
  and `restart`

  You are expected to create a *program* to be run with the functions
  available in the `ablauf.job.ast` namespace. This program is then
  initialized with the rough equivalent of an instruction pointer and
  a context.

  This namespace makes no guess as to how program instructions are
  actually performed, instead, for each position of the program,
  it yields the instructions to carry out. There might be more than
  one if parallelism is used.

  The logical flow is thus:

  - call restart on a program with an empty result list
  - carry out resulting actions
  - call restart on the result of the actions

  For an actual full fledged program runner, a runner using
  **manifold** as the underlying dispatching engine is provided
  in `ablauf.job.manifold`, an SQL backed one in `ablauf.job.sql`.
"
  (:require [clojure.zip        :as zip]
            [clojure.spec.alpha :as s]
            [ablauf.job.ast     :as ast]
            [ablauf.job.node    :as node]
            [exoscale.ex        :as-alias ex]))

(defn ast-zip
  "Builds a `clojure.zip` zipper over `ast`, a well-formed AST as
   produced by `ablauf.job.ast`.

   - branch test: `ast/branch?`
   - children:    the value found under `:ast/nodes`
   - rebuild:     stores the new children back under `:ast/nodes`,
                  coerced to a vector"
  [ast]
  (let [children  :ast/nodes
        make-node (fn [node kids]
                    (assoc node :ast/nodes (vec kids)))]
    (zip/zipper ast/branch? children make-node ast)))

(defn augmentable?
  "True when `node` is non-nil and its `:ast/augment` entry carries
   both a non-nil `:augment/source` and a non-nil `:augment/dest`.
   Always returns a boolean."
  [{:ast/keys [augment] :as node}]
  ;; De Morgan form: augmentable unless any required piece is missing.
  (not (or (nil? node)
           (nil? (:augment/source augment))
           (nil? (:augment/dest augment)))))

(defn- errored?
  "True when `node` is non-nil and its `:exec/result` is anything other
   than `:result/success` (a missing result therefore counts as errored).
   Always returns a boolean."
  [{:exec/keys [result] :as node}]
  (if (nil? node)
    false
    (not= :result/success result)))

(defn- lift-error
  "Stores the node's `:exec/output` in `context` under
   `:exec/last-error` and returns the updated context.
   Can be thought of as the equivalent of Clojure's `*e`."
  [context node]
  (let [{:exec/keys [output]} node]
    (assoc context :exec/last-error output)))

(defn augment
  "Augments `context` from the output of a node carrying an
   `:ast/augment` entry. Nothing happens unless the node's
   `:exec/result` is `:result/success`; in that case a value is
   extracted from `:exec/output` and stored in the context.

   `:augment/source` selects the value:
   - a sequential collection: a path looked up with `get-in`
   - the symbol `identity`:   the whole output
   - a keyword:               a single key looked up with `get`
   Any other source throws an `ex-info` of type `::ex/incorrect`.

   `:augment/dest` is the key, or sequential path of keys, under which
   the value is stored in the context.

   Returns the (possibly updated) context."
  [context {:ast/keys [augment] :exec/keys [result output]}]
  (let [{:augment/keys [source dest]} augment
        ;; A lone key is treated as a path of length one.
        path (if (sequential? dest) dest [dest])]
    (if (not= :result/success result)
      context
      (assoc-in context
                path
                (cond
                  (sequential? source) (get-in output source)
                  (= 'identity source) output
                  (keyword? source)    (get output source)
                  :else                (throw (ex-info
                                               "unknown augment source"
                                               {::ex/type ::ex/incorrect
                                                :source   source})))))))

(defn merge-results
  "Folds a list of node updates into `job`. Node updates either come
   from an action dispatch return, or from newly found dispatchs.

   The zipper is walked forward with `zip/next` from the location `job`
   points at; an update is merged into the first node sharing its
   `:ast/id`, so updates must be supplied in traversal order. Along the
   way the context is augmented by augmentable updates, and the output
   of any update whose result is not a success is recorded as the last
   error.

   Returns `[job context]`. With no updates both inputs are returned
   untouched; otherwise the job is a fresh zipper positioned at the
   root. A nil entry in `nodes` ends the merge.

   Throws an `ex-info` of type `::ex/incorrect` when the end of the
   tree is reached while an update is still unmatched."
  [job context nodes]
  (if (seq nodes)
    (loop [ctx       context
           loc       job
           remaining nodes]
      (let [upd (first remaining)
            ctx (cond-> ctx
                  (augmentable? upd) (augment upd)
                  (errored? upd)     (lift-error upd))]
        (cond
          ;; Every update has been consumed: rewind to the root.
          (nil? upd)
          [(ast-zip (zip/root loc)) ctx]

          ;; Walked the whole tree without finding the update's node.
          (zip/end? loc)
          (throw (ex-info (format "unknown job node: %s" (:ast/id upd))
                          {::ex/type ::ex/incorrect
                           :pos      loc
                           :node     upd}))

          ;; Not this node: keep walking with the same update.
          (not= (:ast/id upd) (:ast/id (zip/node loc)))
          (recur ctx (zip/next loc) remaining)

          ;; Match: merge the update in and move on to the next one.
          :else
          (recur ctx
                 (zip/next (zip/edit loc merge upd))
                 (rest remaining)))))
    [job context]))

(defn merge-dispatchs
  "Merges a list of dispatch nodes into `job`, matching them to tree
   nodes by `:ast/id` while walking forward with `zip/next` from the
   location `job` points at. Dispatchs must be supplied in traversal
   order.

   Returns `job` untouched when `nodes` is empty, otherwise a fresh
   zipper positioned at the root of the updated tree. A nil entry in
   `nodes` ends the merge.

   Throws an `ex-info` of type `::ex/incorrect` when the end of the
   tree is reached while a dispatch is still unmatched."
  [job nodes]
  (if (seq nodes)
    (loop [loc       job
           remaining nodes]
      (let [dispatch (first remaining)]
        (cond
          ;; Every dispatch has been consumed: rewind to the root.
          (nil? dispatch)
          (ast-zip (zip/root loc))

          ;; Walked the whole tree without finding the dispatch's node.
          (zip/end? loc)
          (throw (ex-info (format "unknown job node: %s" (:ast/id dispatch))
                          {::ex/type ::ex/incorrect
                           :pos      loc
                           :node     dispatch}))

          ;; Not this node: keep walking with the same dispatch.
          (not= (:ast/id dispatch) (:ast/id (zip/node loc)))
          (recur (zip/next loc) remaining)

          ;; Match: merge the dispatch in and move on to the next one.
          :else
          (recur (zip/next (zip/edit loc merge dispatch))
                 (rest remaining)))))
    job))

(defn- update-tree
  "Walks `job` forward with `zip/next` from its current location and
   transforms every node for which `(pred node)` is truthy.

   Keyword options:
   - `:pred`    predicate selecting the nodes to transform
   - `:action`  function applied to a selected node through `zip/edit`
   - `:remove?` when exactly `true`, selected nodes are removed with
                `zip/remove` instead and `:action` is ignored

   Returns a fresh zipper positioned at the root of the updated tree."
  [job & {:keys [pred action remove?]}]
  (let [transform (if (true? remove?)
                    zip/remove
                    (fn [loc] (zip/edit loc action)))]
    (loop [loc job]
      (cond
        (zip/end? loc)
        (ast-zip (zip/root loc))

        (pred (zip/node loc))
        (recur (zip/next (transform loc)))

        :else
        (recur (zip/next loc))))))

(defn- idempotent->unstarted!
  "Drops `:exec/result` from every node that is idempotent and either
   pending or failed. Failed nodes are included because they can also
   be retried. Returns the updated job zipper."
  [job]
  (let [retryable? (fn [n]
                     (and (node/idempotent? n)
                          (or (node/pending? n)
                              (node/failed? n))))
        reset      (fn [n] (dissoc n :exec/result))]
    (update-tree job
                 :pred   retryable?
                 :action reset)))

(defn- pending->failure!
  "Marks every pending leaf of `job` as failed.

   `:exec/result` is always set to `:result/failure` on the selected
   leaves; `:exec/reason` is additionally set when `reason` is truthy.
   The single-arity form passes no reason.

   Returns the updated job zipper."
  ([job]
   (pending->failure! job nil))
  ([job reason]
   (letfn [(pending-leaf? [n]
             (and (ast/leaf? n)
                  (node/pending? n)))
           (fail [n]
             ;; The reason is optional, the failure is unconditional.
             (-> n
                 (cond-> reason (assoc :exec/reason reason))
                 (assoc :exec/result :result/failure)))]
     (update-tree job
                  :pred   pending-leaf?
                  :action fail))))

(defn remove-nodes-by
  "Removes every node for which `(f node)` is truthy, whether it is a
   leaf or a branch. Returns the updated job zipper."
  [job f]
  (let [doomed? (fn [n] (f n))]
    (update-tree job :remove? true :pred doomed?)))

(defn abort
  "Given a job, marks all of its pending leafs as failures, recording
   `reason` on each of them. Without an explicit `reason`, the string
   `aborted` is used.

   Yields an updated job."
  ([job]
   (abort job "aborted"))
  ([job reason]
   (-> job
       (pending->failure! reason))))

(defn prepare-replay
  "Prepares a job for being replayed. The whole job is traversed
   twice, in this order:

    1. all idempotent nodes that are pending or failed are marked as
       unstarted
    2. all leafs that are still pending are marked as failures

   Yields the modified job."
  [job]
  (let [reset-job (idempotent->unstarted! job)]
    (pending->failure! reset-job)))

(defn find-dispatchs
  "Yields the result of `node/find-dispatchs` for the node at the
   current location of the `job` zipper."
  [job]
  (-> job
      zip/node
      node/find-dispatchs))

(defn restart
  "Given a `[job context]` tuple and node updates for the job, figure
   out the next course of action to take.

   The updates are first merged into the job and context, the
   dispatchs to perform next are then looked up and merged into the
   job in turn.

   The result has the following structure:

       [job context dispatchs]

   This allows using the return of `restart` as an accumulator
   for `reductions` or similar functions."
  [[job context] results]
  (let [[merged-job merged-context] (merge-results job context results)
        next-dispatchs              (find-dispatchs merged-job)
        next-job                    (merge-dispatchs merged-job next-dispatchs)]
    [next-job merged-context next-dispatchs]))

(defn index-ast
  "Uniquely identifies job nodes, for later merging.

   Walks the zipper forward from `pos` and stores an increasing
   integer, starting at 0, under `:ast/id` on every non-nil node.

   Returns a one-element vector holding a fresh zipper over the
   indexed tree."
  [pos]
  (loop [loc     pos
         next-id 0]
    (cond
      (zip/end? loc)
      [(ast-zip (zip/node loc))]

      ;; Only actual nodes consume an id; nil nodes are skipped.
      (some? (zip/node loc))
      (recur (zip/next (zip/edit loc assoc :ast/id next-id))
             (inc next-id))

      :else
      (recur (zip/next loc) next-id))))

(defn make
  "Creates a job, suitable for `restart`, from a valid AST as
   produced by functions in `ablauf.job.ast`.

   The AST is validated against the `::ast/ast` spec. An invalid AST
   throws an `ex-info` of type `::ex/incorrect` whose message is the
   spec explanation and whose data holds the offending AST under
   `:ast`.

   Returns the result of `index-ast` applied to a zipper over `ast`."
  [ast]
  (when-not (s/valid? ::ast/ast ast)
    ;; `s/explain` prints its report to *out* and returns nil, which
    ;; would leave the exception without a message; `s/explain-str`
    ;; returns the report as a string instead.
    (throw (ex-info (s/explain-str ::ast/ast ast)
                    {:ast ast ::ex/type ::ex/incorrect})))
  (index-ast (ast-zip ast)))

(defn make-with-context
  "Creates a job as `make` does and appends the initial `context` map
   to its result, yielding a tuple suitable for `restart`."
  [ast context]
  (-> ast
      make
      (conj context)))

(defn reload
  "Yields a `[job context]` tuple ready for `restart` from a data AST
   and an optional context. A nil context is replaced by an empty map."
  [ast context]
  (let [job     (ast-zip ast)
        context (if (nil? context) {} context)]
    [job context]))

(defn done?
  "Predicate to test for completion of a (sub)job. Applies
   `node/done?` to the node at the zipper's current location.
   Here is the per-status breakdown:

   | status         | `done?` |
   |----------------|---------|
   | `:job/failure` | Y       |
   | `:job/success` | Y       |
   | `:job/pending` | N       |
  "
  [job]
  (-> job zip/node node/done?))

(defn failed?
  "Predicate to test for failure of a (sub)job. Applies
   `node/failed?` to the node at the zipper's current location.
   Here is the per-status breakdown:

   | status         | `failed?` |
   |----------------|-----------|
   | `:job/failure` | Y         |
   | `:job/success` | N         |
   | `:job/pending` | N         |
  "
  [job]
  (-> job zip/node node/failed?))

(defn pending?
  "Predicate to test for pending completion of a (sub)job. Applies
   `node/pending?` to the node at the zipper's current location.
   Here is the per-status breakdown:

   | status         | `pending?` |
   |----------------|------------|
   | `:job/failure` | N          |
   | `:job/success` | N          |
   | `:job/pending` | Y          |
  "
  [job]
  (-> job zip/node node/pending?))

(defn eligible?
  "Predicate to test for eligibility of a (sub)job. Applies
   `node/eligible?` to the node at the zipper's current location.
   Here is the per-status breakdown:

   | status         | `eligible?` |
   |----------------|-------------|
   | `:job/failure` | N           |
   | `:job/success` | N           |
   | `:job/pending` | Y           |
  "
  [job]
  (-> job zip/node node/eligible?))

(defn status
  "
  Get the job status. Despite its name, `ast` must be a job zipper:
  it is handed as is to the status predicates of this namespace,
  which read the node at the zipper's current location.

  The predicates are tried in this order: `pending?`, `failed?`,
  `done?`, `eligible?`. When none of them holds, an `ex-info` of type
  `::ex/fault` is thrown.

  Status predicates breakdown:
  | status         | `done?` | `failed?` | `eligible?` | `pending?` |
  |----------------|---------|-----------|-------------|------------|
  | `:job/failure` | Y       | Y         | N           | N          |
  | `:job/success` | Y       | N         | N           | N          |
  | `:job/pending` | N       | N         | Y           | Y          |
  "
  [ast]
  ;; `condp` calls the dispatch function with each predicate in turn
  ;; and stops at the first one holding for the job.
  (condp (fn [holds? job] (holds? job)) ast
    pending?  :job/pending
    failed?   :job/failure
    done?     :job/success
    eligible? :job/pending
    (throw (ex-info "Wrong AST job state"
                    {::ex/type ::ex/fault}))))

(defn prune
  "Removes every non-root node whose `:ast/nodes` is present but
   empty. After a removal the walk resumes from the location returned
   by `zip/remove`, so a parent left without children is removed in
   turn.

   Takes a data AST and returns the pruned data AST."
  [ast]
  (loop [loc (zip/next (ast-zip ast))]
    (if-not (zip/end? loc)
      (let [{:ast/keys [nodes]} (zip/node loc)
            ;; `zip/path` is nil at the root, which is never removed.
            removable?          (and (some? nodes)
                                     (zip/path loc)
                                     (empty? nodes))]
        (recur (if removable?
                 (zip/remove loc)
                 (zip/next loc))))
      (zip/root loc))))

(defn unzip
  "Yields the data AST held by a program's zipper: the root node of
   the tree, with all pending changes applied, wherever the zipper is
   currently positioned."
  [zipper]
  (-> zipper zip/root))