FluxML · lorenzoh · Jul 29, 2022 · Jun 18, 2022 · Jun 22, 2022 · Jun 23, 2022
diff --git a/src/FastAI.jl b/src/FastAI.jl
@@ -109,6 +109,9 @@ include("Tabular/Tabular.jl")
 include("Textual/Textual.jl")
 @reexport using .Textual
 
+include("TimeSeries/TimeSeries.jl")
+@reexport using .TimeSeries
+
 include("deprecations.jl")
 export
     methodmodel,
@@ -168,6 +171,7 @@ export
     Continuous,
     Image,
     Paragraph,
+    TimeSeriesRow,
 
     # encodings
     encode,

diff --git a/src/TimeSeries/TimeSeries.jl b/src/TimeSeries/TimeSeries.jl
@@ -0,0 +1,52 @@
+module TimeSeries
+
+
+using ..FastAI
+using ..FastAI:
+    # blocks
+    Block, WrapperBlock, AbstractBlock, OneHotTensor, OneHotTensorMulti, Label,
+    LabelMulti, wrapped, Continuous, getencodings, getblocks, encodetarget, encodeinput,
+    # encodings
+    Encoding, StatefulEncoding, OneHot,
+    # visualization
+    ShowText,
+    # other
+    Context, Training, Validation
+import ..FastAI: Datasets
+using ..FastAI.Datasets
+# for tests
+using ..FastAI: testencoding
+
+# extending
+import ..FastAI:
+    blockmodel, blockbackbone, blocklossfn, encode, decode, checkblock,
+    encodedblock, decodedblock, showblock!, mockblock, setup
+
+import MLUtils: MLUtils, eachobs, getobs, numobs
+import Requires: @require
+import Statistics
+
+using FilePathsBase
+using InlineTest
+
+# Blocks
+include("blocks/timeseriesrow.jl")
+
+include("encodings/timeseriespreprocessing.jl");
+
+const _tasks = Dict{String, Any}()
+include("tasks/classification.jl")
+
+include("recipes.jl")
+
+# Module initializer: registers the dataset recipes, then adds every entry of
+# `_tasks` to the collection returned by `FastAI.learningtasks()` unless an
+# entry with the same `id` is already present.
+function __init__()
+    _registerrecipes()
+    for task in values(_tasks)
+        haskey(FastAI.learningtasks(), task.id) && continue
+        push!(FastAI.learningtasks(), task)
+    end
+end
+
+export 
+    TimeSeriesRow, TSClassificationSingle, TimeSeriesPreprocessing
-export 
-    TimeSeriesRow, TSClassificationSingle, TimeSeriesPreprocessing
+export 
+    TimeSeriesRow, TSClassificationSingle, TSPreprocessing
-export 
-    TimeSeriesRow, TSClassificationSingle, TimeSeriesPreprocessing
+export 
+    TimeSeriesRow, TSClassificationSingle, TSPreprocessing
+end
diff --git a/src/TimeSeries/blocks/timeseriesrow.jl b/src/TimeSeries/blocks/timeseriesrow.jl
@@ -0,0 +1,42 @@
+"""
+    TimeSeriesRow(nfeatures, obslength) <: Block
+
+[`Block`](#) for a time series with `nfeatures` variables and `obslength` time steps.
+`obs` is valid for `TimeSeriesRow(nfeatures, obslength)` if it is an
+`(nfeatures, obslength)` matrix with a numeric element type.
+
+## Examples
+
+Creating a block:
+
+```julia
+TimeSeriesRow(1, 51)  # Univariate time series with length 51.
+TimeSeriesRow(2, 51)  # Multivariate time series with 2 variables and length 51.
+```
+
+You can create a random observation using [`mockblock`](#):
+
+{cell=main}
+```julia
+using FastAI
+FastAI.mockblock(TimeSeriesRow(1, 10))
+```
+"""
+struct TimeSeriesRow <: Block
+    # Number of variables, i.e. the first dimension of an observation.
+    nfeatures::Int
+    # Number of time steps, i.e. the second dimension of an observation.
+    # The field type also admits `:`.
+    obslength::Union{Int, Colon}
+end
+
+# Return `true` when the numeric matrix `obs` has `row.nfeatures` rows and, if
+# `row.obslength` is an integer, exactly that many columns. A `Colon` length is
+# treated as unconstrained, because comparing a size against `:` is never equal.
+function checkblock(row::TimeSeriesRow, obs::AbstractArray{T,2}) where {T<:Number}
+    nrows, ncols = size(obs)
+    nrows == row.nfeatures || return false
+    return row.obslength isa Colon || ncols == row.obslength
+end
+
+# Create a random `Float64` observation whose dimensions are taken from the
+# block's `nfeatures` and `obslength` fields.
+function mockblock(row::TimeSeriesRow)
+    dims = (row.nfeatures, row.obslength)
+    return rand(Float64, dims)
+end
+
+# Build a `TimeSeriesRow` block whose dimensions are read off the size of the
+# first element of `data`.
+function setup(::Type{TimeSeriesRow}, data)
+    dims = size(data[1])
+    nfeatures, obslength = dims
+    return TimeSeriesRow(nfeatures, obslength)
+end
diff --git a/src/TimeSeries/encodings/timeseriespreprocessing.jl b/src/TimeSeries/encodings/timeseriespreprocessing.jl
@@ -0,0 +1,51 @@
+"""
+    TSPreprocessing(tfms) <: Encoding
+
+Encoding for `TimeSeriesRow`s that applies the functions stored in `tfms` to an
+observation, one after another. It is intended for normalizing the time-series
+values, either per variable or per time step.
+
+Encodes
+- `TimeSeriesRow` -> `TimeSeriesRow`
+"""
+struct TSPreprocessing <: Encoding
+    # Collection of callables; `encode` iterates over `values(tfms)`.
+    tfms
+end
+
+# Convenience constructor: an encoding with an empty list of transformations.
+TSPreprocessing() = TSPreprocessing([])
+
+# The encoding does not change the block: a `TimeSeriesRow` maps to itself.
+encodedblock(p::TSPreprocessing, block::TimeSeriesRow) = block
+
+# Apply every transformation in `p.tfms` to `obs` in iteration order, feeding
+# the result of one into the next, and return the final value. With no
+# transformations `obs` is returned unchanged.
+function encode(p::TSPreprocessing, context, block::TimeSeriesRow, obs)
+    return foldl((acc, tfm) -> tfm(acc), values(p.tfms); init = obs)
+end
+
+# Compute the mean and standard deviation of `data` over a subset of its first
+# three axes and return them as `(mean, std)`.
+#
+# Keyword arguments:
+# - `by_var`:  when `true`, axis 2 is kept, so statistics are computed per index
+#              along that axis.
+# - `by_step`: when `true`, axis 3 is kept.
+#
+# Every axis among 1, 2, 3 that is not kept is reduced over, so with both
+# keywords `false` a single statistic over all three axes is returned.
+# NOTE(review): presumably axis 2 indexes variables and axis 3 time steps —
+# confirm against the layout of the dataset that is passed in.
+function tsdatasetstats(
+    data;
+    by_var=false,
+    by_step=false
+)
+    kept = Int[]
+    by_var && push!(kept, 2)
+    by_step && push!(kept, 3)
+    dims = Tuple(ax for ax in 1:3 if !(ax in kept))
+    return Statistics.mean(data; dims=dims), Statistics.std(data; dims=dims)
+end
+
+# NOTE(review): this method returns the `(means, stds)` tuple produced by
+# `tsdatasetstats` called with its default keywords; it does not construct a
+# `TSPreprocessing` instance.
+function setup(::Type{TSPreprocessing}, ::TimeSeriesRow, data)
+    means, stds = tsdatasetstats(data)
+end
-function setup(::Type{TSPreprocessing}, ::TimeSeriesRow, data)
-    means, stds = tsdatasetstats(data)
-end
+setup(::Type{TSPreprocessing}, ::TimeSeriesRow, data) = means, stds = tsdatasetstats(data)
-function setup(::Type{TSPreprocessing}, ::TimeSeriesRow, data)
-    means, stds = tsdatasetstats(data)
-end
+setup(::Type{TSPreprocessing}, ::TimeSeriesRow, data) = means, stds = tsdatasetstats(data)
diff --git a/src/TimeSeries/makie.jl b/src/TimeSeries/makie.jl
diff --git a/src/TimeSeries/recipes.jl b/src/TimeSeries/recipes.jl
@@ -0,0 +1,63 @@
+"""
+    TimeSeriesDatasetRecipe(; train_file, test_file = nothing, loadfn = Datasets.loadfile)
+
+Recipe for loading a time series dataset stored in `.ts` files.
+
+## Keyword arguments
+
+- `train_file`: name of the training file; it is joined onto the dataset path when
+  the recipe is loaded.
+- `test_file`: name of the test file, joined onto the dataset path in the same way.
+  Defaults to `nothing`.
+- `loadfn`: function called with a file path; its result is destructured into the
+  rows and the labels. Defaults to `Datasets.loadfile`.
+"""
+Base.@kwdef struct TimeSeriesDatasetRecipe <: Datasets.DatasetRecipe
+    train_file
+    test_file = nothing
+    loadfn = Datasets.loadfile
+end
+
+# Block types produced by this recipe: a time-series input and a label target.
+function Datasets.recipeblocks(::Type{TimeSeriesDatasetRecipe})
+    return Tuple{TimeSeriesRow, Label}
+end
+
+# Load the dataset described by `recipe` from the directory `path`.
+#
+# The training file is always read with `recipe.loadfn`. When `recipe.test_file`
+# is set, the test file is read as well and its rows and labels are appended to
+# the training ones. Returns `(data, blocks)` where `data` is
+# `(TimeSeriesDataset(rows), labels)` and `blocks` holds the matching
+# `TimeSeriesRow` and `Label` blocks.
+function Datasets.loadrecipe(recipe::TimeSeriesDatasetRecipe, path)
+    path = convert(String, path)
+    rows, labels = recipe.loadfn(joinpath(path, recipe.train_file))
+    # `test_file` defaults to `nothing`, and `joinpath` has no method for it, so
+    # the test split is only loaded when a file name was actually given.
+    if !isnothing(recipe.test_file)
+        rows_test, labels_test = recipe.loadfn(joinpath(path, recipe.test_file))
+        rows = [rows; rows_test]
+        labels = [labels; labels_test]
+    end
+    rows = TimeSeriesDataset(rows)
+    data = rows, labels
+    blocks = (
+        setup(TimeSeriesRow,rows),
+        Label(unique(eachobs(labels))),
+    )
+    return data, blocks
+end
+
+# Registering recipes
+
+# Maps a dataset name to the list of recipes available for it. `_registerrecipes`
+# iterates over this dictionary to populate the recipe registry.
+const RECIPES = Dict{String,Vector{Datasets.DatasetRecipe}}(
+    "ecg5000" => [
+        TimeSeriesDatasetRecipe(train_file="ECG5000_TRAIN.ts", test_file="ECG5000_TEST.ts")
+    ],
+)
+
+# Add an entry to `datarecipes()` for each recipe in `RECIPES`, skipping any
+# recipe whose dataset name is already a key of the registry. The entry uses the
+# dataset name as both `id` and `datasetid`.
+function _registerrecipes()
+    for (name, recipes) in RECIPES
+        for recipe in recipes
+            haskey(datarecipes(), name) && continue
+            push!(datarecipes(), (
+                id = name,
+                datasetid = name,
+                blocks = Datasets.recipeblocks(recipe),
+                package = @__MODULE__,
+                recipe = recipe,
+            ))
+        end
+    end
+end
+
+# ## Tests
+
+# Loads the ECG5000 recipe and checks that the first observation is valid for
+# the blocks returned alongside the data.
+@testset "TimeSeriesDataset [recipe]" begin
+    dir = datasetpath("ecg5000")
+    recipe = TimeSeriesDatasetRecipe(train_file="ECG5000_TRAIN.ts", test_file="ECG5000_TEST.ts")
+    data, blocks = loadrecipe(recipe, dir)
+    @test checkblock(blocks, getobs(data, 1))
+end
diff --git a/src/TimeSeries/tasks/classification.jl b/src/TimeSeries/tasks/classification.jl
@@ -0,0 +1,29 @@
+"""
+    TSClassificationSingle(blocks, data)
+
+Learning task for single-label time-series classification: every time series is
+classified into one of the classes of the `Label` block. The only encoding applied
+is `OneHot`; `data` is required by the signature but is not used to build the task.
+"""
+function TSClassificationSingle(
+    blocks::Tuple{<:TimeSeriesRow, <:Label},
+    data
+)
+    # The trailing comma makes this a 1-tuple of encodings; `(OneHot())` without
+    # it is just a parenthesized `OneHot()`.
+    return SupervisedTask(blocks, (OneHot(),))
+end
+
+# Registry entry for the single-label classification task. It is stored under
+# the key "tsclfsingle"; the module's `__init__` uses the entry's `id` field
+# when adding it to the learning-task registry.
+_tasks["tsclfsingle"] = (
+    id = "timeseries/single",
+    name = "Time-Series Classification (single-label)",
+    constructor = TSClassificationSingle,
+    blocks = (TimeSeriesRow, Label),
+    category = "supervised",
+    description = """
+        Time-Series classification task where every time-series has a single 
+        class label associated with it.
+        """,
+    package = @__MODULE__,
+)
diff --git a/src/datasets/Datasets.jl b/src/datasets/Datasets.jl
@@ -38,12 +38,14 @@ end
 export
     # primitive containers
     TableDataset,
+    TimeSeriesDataset,
 
     mapobs, eachobs, groupobs, shuffleobs, ObsView,
 
     # utilities
     isimagefile,
     istextfile,
+    istimeseriesfile,
     matches,
     loadfile,
     loadmask,