forked from zero-one-group/geni
/
tuning.clj
36 lines (33 loc) · 1.41 KB
/
tuning.clj
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
(ns zero-one.geni.ml.tuning
(:require
[zero-one.geni.interop :as interop])
(:import
(org.apache.spark.ml.tuning CrossValidator
ParamGridBuilder
TrainValidationSplit)))
(defn param-grid
  "Builds the param grid used by the tuning estimators.

  `grids` is a seqable of [stage grid-map] pairs (for example a map keyed by
  stage). Each grid-map is a seqable of [param-keyword values] pairs. For every
  pair, the param is looked up on the stage with `interop/get-field`, the
  values are converted with `interop/->scala-seq`, and both are registered on
  one shared ParamGridBuilder. Returns the result of calling `.build` on that
  builder."
  [grids]
  (let [builder (ParamGridBuilder.)]
    ;; The return value of .addGrid is ignored; only its effect on `builder`
    ;; matters. doseq walks the nested pairs eagerly, in the same order as the
    ;; previous nested doall/for, without allocating throwaway result seqs.
    (doseq [[stage grid-map]     grids
            [param-keyword grid] grid-map]
      (.addGrid builder
                (interop/get-field stage param-keyword)
                (interop/->scala-seq grid)))
    (.build builder)))
(defn cross-validator
  "Creates a CrossValidator configured from an options map.

  Recognised keys: :estimator, :evaluator, :estimator-param-maps, :num-folds,
  :seed and :parallelism. Each key is applied through the matching setter only
  when its value is truthy; for a nil, false or absent key the setter is not
  called. Returns the configured CrossValidator."
  [{:keys [estimator evaluator estimator-param-maps num-folds seed parallelism]}]
  ;; One cond-> threads the validator through every setter whose option was
  ;; supplied, in the same order as before.
  (cond-> (CrossValidator.)
    estimator            (.setEstimator estimator)
    evaluator            (.setEvaluator evaluator)
    estimator-param-maps (.setEstimatorParamMaps estimator-param-maps)
    num-folds            (.setNumFolds num-folds)
    seed                 (.setSeed seed)
    parallelism          (.setParallelism parallelism)))
(defn train-validation-split
  "Creates a TrainValidationSplit configured from an options map.

  Recognised keys: :estimator, :evaluator, :estimator-param-maps, :train-ratio,
  :seed and :parallelism. Each key is applied through the matching setter only
  when its value is truthy; for a nil, false or absent key the setter is not
  called. Returns the configured TrainValidationSplit.

  :train-ratio is optional and is forwarded to `.setTrainRatio`. Callers that
  do not pass it get exactly the previous behaviour."
  [{:keys [estimator evaluator estimator-param-maps train-ratio seed parallelism]}]
  (cond-> (TrainValidationSplit.)
    estimator            (.setEstimator estimator)
    evaluator            (.setEvaluator evaluator)
    estimator-param-maps (.setEstimatorParamMaps estimator-param-maps)
    ;; Counterpart of :num-folds on cross-validator: controls how the data is
    ;; divided between training and validation.
    train-ratio          (.setTrainRatio train-ratio)
    seed                 (.setSeed seed)
    parallelism          (.setParallelism parallelism)))