src/learning_curves.jl

## LEARNING CURVES

"""
    curve = learning_curve(mach; resolution=30,
                                 resampling=Holdout(),
                                 repeats=1,
                                 measure=default_measure(mach.model),
                                 rows=nothing,
                                 weights=nothing,
                                 operation=nothing,
                                 range=nothing,
                                 acceleration=default_resource(),
                                 acceleration_grid=CPU1(),
                                 rngs=nothing,
                                 rng_name=nothing)

Given a supervised machine `mach`, return a named tuple of objects
suitable for generating a plot of performance estimates, as a function
of the single hyperparameter specified in `range`. The tuple `curve`
has the following keys: `:parameter_name`, `:parameter_scale`,
`:parameter_values`, `:measurements`.

To generate multiple curves for a `model` with a random number
generator (RNG) as a hyperparameter, specify the name, `rng_name`, of
the (possibly nested) RNG field, and a vector `rngs` of RNG's, one for
each curve. Alternatively, set `rngs` to the number of curves desired,
in which case RNG's are automatically generated. The individual curve
computations can be distributed across multiple processes using
`acceleration=CPUProcesses()` or `acceleration=CPUThreads()`. See the
second example below for a demonstration.

```julia
X, y = @load_boston;
atom = @load RidgeRegressor pkg=MultivariateStats
ensemble = EnsembleModel(atom=atom, n=1000)
mach = machine(ensemble, X, y)
r_lambda = range(ensemble, :(atom.lambda), lower=10, upper=500, scale=:log10)
curve = learning_curve(mach; range=r_lambda, resampling=CV(), measure=mav)
using Plots
plot(curve.parameter_values,
     curve.measurements,
     xlab=curve.parameter_name,
     xscale=curve.parameter_scale,
     ylab = "CV estimate of RMS error")
```

If using a `Holdout()` `resampling` strategy (with no shuffling) and
if the specified hyperparameter is the number of iterations in some
iterative model (and that model has an appropriately overloaded
`MLJModelInterface.update` method) then training is not restarted from
scratch for each increment of the parameter, i.e., the model is trained
progressively.

```julia
atom.lambda=200
r_n = range(ensemble, :n, lower=1, upper=250)
curves = learning_curve(mach; range=r_n, verbosity=0, rng_name=:rng, rngs=3)
plot!(curves.parameter_values,
     curves.measurements,
     xlab=curves.parameter_name,
     ylab="Holdout estimate of RMS error")
```

    learning_curve(model::Supervised, X, y; kwargs...)
    learning_curve(model::Supervised, X, y, w; kwargs...)

Generate the data for a learning curve (or curves) directly, without
first constructing a machine.

### Summary of key-word options

- `range` - the one-dimensional parameter range specifying the
  hyperparameter to be varied; must be specified

- `resolution` - number of points generated from `range` (number of
  model evaluations); default is `30`

- `acceleration` - parallelization option for distributing the
  computation of multiple curves (one per RNG); an instance of `CPU1`,
  `CPUProcesses` or `CPUThreads` from `ComputationalResources.jl`;
  default is `default_resource()`

- `acceleration_grid` - parallelization option passed to the
  underlying `TunedModel`, for distributing each performance
  evaluation; default is `CPU1()`

- `rngs` - for specifying random number generator(s) to be passed to
  the model (see above)

- `rng_name` - name of the model hyper-parameter representing a random
  number generator (see above); possibly nested

Other key-word options are documented at [`TunedModel`](@ref).

"""
function learning_curve(mach::Machine{<:Supervised}; kwargs...)
    # Forward to the model-based method, re-using the data bound to `mach`.
    return learning_curve(mach.model, mach.args...; kwargs...)
end

# Model-based method doing the actual work. A `TunedModel` wrapping
# `model` is constructed, using a non-shuffled `Grid` of `resolution`
# points over `range`, and bound to `args` in a machine. That machine
# is fit once (when `rngs === nothing`) or once per RNG in `rngs`, and
# the `plotting` part of its report is repackaged as the return value.
#
# Returns a named tuple with keys `parameter_name`, `parameter_scale`,
# `parameter_values` and `measurements`.
#
# Throws an error if no range is given, if `rngs` is specified without
# `rng_name`, if `rngs` has an unsupported type, or if `rngs` is empty.
#
# `ranges` is accepted as an alias for `range` (it provides the
# default value of `range`).
#
# NOTE(review): `check_measure` is accepted but not used in this
# method - confirm whether it should be forwarded to `TunedModel`.
function learning_curve(model::Supervised, args...;
                        resolution=30,
                        resampling=Holdout(),
                        weights=nothing,
                        measures=nothing,
                        measure=measures,
                        rows=nothing,
                        operation=nothing,
                        ranges::Union{Nothing,ParamRange}=nothing,
                        range::Union{Nothing,ParamRange}=ranges,
                        repeats=1,
                        acceleration=default_resource(),
                        acceleration_grid=CPU1(),
                        verbosity=1,
                        rngs=nothing,
                        rng_name=nothing,
                        check_measure=true)

    range !== nothing || error("No param range specified. Use range=... ")

    # normalize `rngs` to a vector of RNG's (or leave as `nothing`):
    if rngs !== nothing
        rng_name === nothing &&
            error("Having specified `rngs=...`, you must specify "*
                  "`rng_name=...` also. ")
        if rngs isa Integer
            rngs = MersenneTwister.(1:rngs)
        elseif rngs isa AbstractRNG
            rngs = [rngs, ]
        elseif !(rngs isa AbstractVector{<:AbstractRNG})
            error("`rngs` must have type `Integer` , `AbstractRNG` or "*
                  "`AbstractVector{<:AbstractRNG}`. ")
        end
        # the per-RNG results are combined by a reduction, which is
        # undefined for an empty collection:
        isempty(rngs) &&
            error("`rngs` must specify at least one RNG. ")
    end

    if (acceleration isa CPUProcesses &&
        acceleration_grid isa CPUProcesses)
        message =
            "The combination acceleration=$(acceleration) and"*
            " acceleration_grid=$(acceleration_grid) is"*
            "  not generally optimal. You may want to consider setting"*
            " `acceleration = CPUProcesses()` and"*
            " `acceleration_grid = CPUThreads()`."
        @warn message
    end
    if (acceleration isa CPUThreads &&
        acceleration_grid isa CPUProcesses)
        message =
            "The combination acceleration=$(acceleration) and"*
            " acceleration_grid=$(acceleration_grid) isn't supported. \n"*
            "Resetting to"*
            " `acceleration = CPUProcesses()` and"*
            " `acceleration_grid = CPUThreads()`."
        @warn message
        acceleration = CPUProcesses()
        acceleration_grid = CPUThreads()
    end
    _acceleration = _process_accel_settings(acceleration)

    # `acceleration_grid` controls the evaluation of the grid points;
    # `_acceleration` controls the distribution of the curves (one per
    # RNG) and is used for dispatch in `_tuning_results`:
    tuned_model = TunedModel(model=model,
                             range=range,
                             tuning=Grid(resolution=resolution,
                                         shuffle=false),
                             resampling=resampling,
                             operation=operation,
                             measure=measure,
                             train_best=false,
                             weights=weights,
                             repeats=repeats,
                             acceleration=acceleration_grid)

    tuned = machine(tuned_model, args...)

    results =
        _tuning_results(rngs, _acceleration, tuned, rows, rng_name, verbosity)

    # only one hyperparameter is varied, so take the first (only) entry:
    parameter_name = results.parameter_names[1]
    parameter_scale = results.parameter_scales[1]
    parameter_values = [results.parameter_values[:, 1]...]
    measurements = results.measurements

    return (parameter_name=parameter_name,
            parameter_scale=parameter_scale,
            parameter_values=parameter_values,
            measurements=measurements)
end

# Combine the results of two curve computations: the returned named
# tuple is `plotting1` with its `measurements` replaced by the
# horizontal concatenation of the measurements of `plotting1` and
# `plotting2` (one column per curve).
function _collate(plotting1, plotting2)
    side_by_side = hcat(plotting1.measurements, plotting2.measurements)
    return merge(plotting1, (measurements=side_by_side,))
end

# fallback:
#_tuning_results(rngs, acceleration, tuned, rows, rngs_name, verbosity) =
#    error("acceleration=$acceleration unsupported. ")

# single curve (no RNG's specified); the `acceleration` and
# `rngs_name` arguments are ignored:
function _tuning_results(rngs::Nothing,
                         acceleration,
                         tuned,
                         rows,
                         rngs_name,
                         verbosity)
    return _single_curve(tuned, rows, verbosity)
end

# Force a (re)fit of the machine `tuned` on the specified `rows` and
# return the `plotting` entry of its report.
function _single_curve(tuned, rows, verbosity)
    fit!(tuned; rows=rows, verbosity=verbosity, force=true)
    curve_data = report(tuned).plotting
    return curve_data
end

# CPU1: compute one curve per RNG in `rngs`, sequentially. For each
# RNG, the model field named `rng_name` is overwritten, the machine
# `tuned` is refit, and the resulting plotting data is merged with
# that of the previous curves using `_collate`. The original value of
# the RNG field is restored before returning, even if a fit throws.
function _tuning_results(rngs::AbstractVector,
                         acceleration::CPU1,
                         tuned,
                         rows,
                         rng_name,
                         verbosity)

    old_rng = recursive_getproperty(tuned.model.model, rng_name)
    n_rngs = length(rngs)

    p = Progress(n_rngs,
         dt = 0,
         desc = "Evaluating Learning curve with $(n_rngs) rngs: ",
         barglyphs = BarGlyphs("[=> ]"),
         barlen = 18,
         color = :yellow)

    # the progress bar is only shown for positive verbosity:
    verbosity < 1 ||  update!(p,0)

    ret = try
        mapreduce(_collate, rngs) do rng
            recursive_setproperty!(tuned.model.model, rng_name, rng)
            # the inner fit is one level quieter than this loop:
            fit!(tuned, rows=rows, verbosity=verbosity-1, force=true)
            r = report(tuned).plotting
            verbosity < 1 || begin
                p.counter += 1
                ProgressMeter.updateProgress!(p)
            end
            r
        end
    finally
        # never leave the caller's model with a substituted RNG:
        recursive_setproperty!(tuned.model.model, rng_name, old_rng)
    end

    return ret
end

# CPUProcesses: compute one curve per RNG in `rngs` using a
# `@distributed` loop, with `_collate` as the reducer. Progress is
# reported through a `RemoteChannel` hosted on process 1: each
# iteration puts `true`, and a final `false` stops the task updating
# the progress bar. The original value of the model's RNG field is
# restored before returning, even if the computation throws.
function _tuning_results(rngs::AbstractVector,
                         acceleration::CPUProcesses,
                         tuned,
                         rows,
                         rng_name,
                         verbosity)

    old_rng = recursive_getproperty(tuned.model.model, rng_name)
    n_rngs = length(rngs)

    ret = try
        @sync begin

            p = Progress(n_rngs,
                 dt = 0,
                 desc = "Evaluating Learning curve with $(n_rngs) rngs: ",
                 barglyphs = BarGlyphs("[=> ]"),
                 barlen = 18,
                 color = :yellow)

            channel = RemoteChannel(()->Channel{Bool}(min(1000, n_rngs)), 1)

            # printing the progress bar
            verbosity < 1 || begin
                update!(p,0)
                @async while take!(channel)
                    p.counter +=1
                    ProgressMeter.updateProgress!(p)
                end
            end

            ret_ = @distributed (_collate) for rng in rngs
                recursive_setproperty!(tuned.model.model, rng_name, rng)
                fit!(tuned, rows=rows, verbosity=verbosity-1, force=true)
                r = report(tuned).plotting
                verbosity < 1 || put!(channel, true)
                r
            end

            # signal the progress task to finish:
            verbosity < 1 || put!(channel, false)
            ret_
        end
    finally
        # never leave the caller's model with a substituted RNG:
        recursive_setproperty!(tuned.model.model, rng_name, old_rng)
    end

    return ret
end

# CPUThreads: compute one curve per RNG in `rngs`, with the RNG
# indices split into partitions and one spawned task per partition.
# Falls back to the `CPU1` method when only one thread is available.
# Each task works with its own machine (the first re-uses `tuned`; the
# others wrap deep copies of the model) and reduces its curves with
# `_collate`; the per-task results are then reduced again. The
# original value of the RNG field of `tuned`'s model is restored
# before returning, even if the computation throws.
@static if VERSION >= v"1.3.0-DEV.573"
    function _tuning_results(rngs::AbstractVector,
                             acceleration::CPUThreads,
                             tuned,
                             rows,
                             rng_name,
                             verbosity)

        n_threads = Threads.nthreads()
        if n_threads == 1
            return _tuning_results(rngs,
                                   CPU1(),
                                   tuned,
                                   rows,
                                   rng_name,
                                   verbosity)
        end

        old_rng = recursive_getproperty(tuned.model.model, rng_name)
        n_rngs = length(rngs)
        ntasks = acceleration.settings
        # presumably splits the indices into at most `ntasks` chunks -
        # confirm against `MLJBase.chunks`:
        partitions = MLJBase.chunks(1:n_rngs, ntasks)

        p = Progress(n_rngs,
             dt = 0,
             desc = "Evaluating Learning curve with $(n_rngs) rngs: ",
             barglyphs = BarGlyphs("[=> ]"),
             barlen = 18,
             color = :yellow)

        # tasks put `true` after each fit; a final `false` stops the
        # task updating the progress bar:
        ch = Channel{Bool}(length(partitions))

        # one slot per partition, filled by the corresponding task:
        ret_ = Vector(undef, length(partitions))

        try
            @sync begin
                verbosity < 1 || begin
                    update!(p,0)
                    @async while take!(ch)
                        p.counter +=1
                        ProgressMeter.updateProgress!(p)
                    end
                end

                # One t_tuned per task
                ## deepcopy of model is because other threads can still
                ## change the state of tuned.model.model
                tmachs = [tuned,
                          [machine(TunedModel(model = deepcopy(tuned.model.model),
                                              range=deepcopy(tuned.model.range),
                                              tuning=tuned.model.tuning,
                                              resampling=tuned.model.resampling,
                                              operation=tuned.model.operation,
                                              measure=tuned.model.measure,
                                              train_best=tuned.model.train_best,
                                              weights=tuned.model.weights,
                                              repeats=tuned.model.repeats,
                                              acceleration=tuned.model.acceleration),
                                   tuned.args...) for _ in 2:length(partitions)]...]
                @sync for (i,rng_part) in enumerate(partitions)
                    Threads.@spawn begin
                        ret_[i] = mapreduce(_collate, rng_part) do k
                            recursive_setproperty!(tmachs[i].model.model,
                                                   rng_name, rngs[k])
                            fit!(tmachs[i], rows=rows,
                                 verbosity=verbosity-1, force=true)
                            verbosity < 1 || put!(ch, true)
                            report(tmachs[i]).plotting
                        end
                    end
                end
                # signal the progress task to finish:
                verbosity < 1 || put!(ch, false)
            end

            return reduce(_collate, ret_)
        finally
            # never leave the caller's model with a substituted RNG:
            recursive_setproperty!(tuned.model.model, rng_name, old_rng)
        end
    end

end