Feat/static covs #966

Merged: 29 commits from feat/static_covs into master (Jun 5, 2022)
Changes shown are from 11 of the 29 commits.

Commits:
125c078
added methods `from_longitudinal_dataframe` and `add_static_covariates`
dennisbader Apr 13, 2022
fde974e
dataset adaption for static covs
dennisbader Apr 23, 2022
d6d4885
extended datasets for static covariates support and unified variable …
dennisbader May 19, 2022
4717ff1
adapted PLXCovariatesModules with static covariates
dennisbader May 19, 2022
5b6b781
adapted TFTModel for static covariate support
dennisbader May 20, 2022
55eaf3b
added temporary fix for static covariates with scalers
dennisbader May 20, 2022
3ced3da
Merge branch 'master' into feat/static_covs
dennisbader May 20, 2022
29924f4
unittests for from_longitudinal_dataframe() and set_static_covariates
dennisbader May 24, 2022
079d969
updated dataset tests
dennisbader May 24, 2022
3511b81
fixed all downstream issues from new static covariates in datasets
dennisbader May 27, 2022
eacaf3b
added check for equal static covariates between fit and predict
dennisbader May 28, 2022
55c5090
added tests for passing static covariates in TimeSeries methods
dennisbader May 28, 2022
cc07f5f
added static covariate support for stacking TimeSeries
dennisbader May 28, 2022
0aacd5a
transpose static covariates
dennisbader May 29, 2022
2845f86
added method `static_covariates_values()`
dennisbader May 29, 2022
2ac58e4
updated docs
dennisbader May 29, 2022
a6fa4fb
static covariate support for concatenation
dennisbader May 30, 2022
a4ba617
static covariate support for concatenation
dennisbader May 30, 2022
0586b7d
static covariates are now passed to the torch models
dennisbader May 30, 2022
c18e806
non-numerical dtype support for static covariates
dennisbader May 31, 2022
a048ecc
added slicing support for static covariates
dennisbader May 31, 2022
3661385
multicomponent static covariate support for TFT
dennisbader May 31, 2022
5b9258b
Merge branch 'master' into feat/static_covs
dennisbader May 31, 2022
3a9ad83
added arithmetic static covariate support
dennisbader May 31, 2022
d00c08d
Merge branch 'master' into feat/static_covs
dennisbader Jun 3, 2022
f5fa989
updated all timeseries methods/operations with static cov transfer
dennisbader Jun 4, 2022
41adf3f
applied suggestion from PR review part 1
dennisbader Jun 4, 2022
6dc7ff8
apply suggestions from code review part 2
dennisbader Jun 4, 2022
d001e17
fix black issue from PR suggestion
dennisbader Jun 4, 2022
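The commit messages above name the new user-facing entry points. As a hedged illustration only: the sketch below exercises `TimeSeries.from_longitudinal_dataframe` and `static_covariates_values()`, both taken from the commit messages; the argument names and DataFrame layout are assumptions not confirmed by this diff.

```python
# Hedged sketch of the API surface named in the commits above.
# `from_longitudinal_dataframe` and `static_covariates_values` come from the
# commit messages; argument names (group_cols, static_cols, ...) are assumed.
import pandas as pd
from darts import TimeSeries

df = pd.DataFrame({
    "time": list(pd.date_range("2022-01-01", periods=6)) * 2,
    "value": range(12),
    "store": ["A"] * 6 + ["B"] * 6,   # one sub-series per store
    "sqft": [100] * 6 + [250] * 6,    # static per store
})

# build one TimeSeries per group, each carrying its static covariates
series_list = TimeSeries.from_longitudinal_dataframe(
    df, group_cols="store", static_cols="sqft",
    time_col="time", value_cols="value",
)
print(series_list[0].static_covariates_values())
```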
4 changes: 2 additions & 2 deletions darts/dataprocessing/transformers/boxcox.py
@@ -167,7 +167,7 @@ def ts_transform(
)
return series.with_values(
BoxCox._reshape_out(series, transformed_vals, component_mask=component_mask)
)
).set_static_covariates(series.static_covariates)

@staticmethod
def ts_inverse_transform(
@@ -185,7 +185,7 @@ def ts_inverse_transform(
BoxCox._reshape_out(
series, inv_transformed_vals, component_mask=component_mask
)
)
).set_static_covariates(series.static_covariates)

def fit(
self, series: Union[TimeSeries, Sequence[TimeSeries]], **kwargs
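Both hunks above apply the same transfer pattern: a transformer that rebuilds a `TimeSeries` via `with_values` must explicitly re-attach the input's static covariates. A minimal sketch of that pattern, with a hypothetical `transform_fn` standing in for the Box-Cox math:

```python
# Minimal sketch of the re-attachment pattern, not the actual BoxCox code.
# `transform_fn` is hypothetical; `with_values`, `set_static_covariates` and
# the `static_covariates` property are the names used in this diff.
def ts_transform_sketch(series, transform_fn):
    transformed_vals = transform_fn(series.all_values())
    # `with_values` returns a fresh TimeSeries, so static covariates
    # would otherwise be lost here
    return series.with_values(transformed_vals).set_static_covariates(
        series.static_covariates
    )
```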
4 changes: 2 additions & 2 deletions darts/dataprocessing/transformers/scaler.py
@@ -106,7 +106,7 @@ def ts_transform(series: TimeSeries, transformer, **kwargs) -> TimeSeries:
values=transformed_vals,
fill_missing_dates=False,
columns=series.columns,
)
).set_static_covariates(series.static_covariates)

@staticmethod
def ts_inverse_transform(
@@ -126,7 +126,7 @@ def ts_inverse_transform(
values=inv_transformed_vals,
fill_missing_dates=False,
columns=series.columns,
)
).set_static_covariates(series.static_covariates)

@staticmethod
def ts_fit(series: TimeSeries, transformer, *args, **kwargs) -> Any:
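From the user's side, this change means scaling no longer drops static covariates. A hedged end-to-end check, assuming static covariates are attached as a small pandas DataFrame (the exact layout is not shown in this diff):

```python
# Hedged usage check; `set_static_covariates` and the `static_covariates`
# property are per this PR, the one-row DataFrame layout is an assumption.
import numpy as np
import pandas as pd
from darts import TimeSeries
from darts.dataprocessing.transformers import Scaler

series = TimeSeries.from_values(np.random.rand(100, 1)).set_static_covariates(
    pd.DataFrame({"store_id": [3], "region": ["west"]})
)
scaled = Scaler().fit_transform(series)
assert scaled.static_covariates.equals(series.static_covariates)
```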
62 changes: 33 additions & 29 deletions darts/models/forecasting/pl_forecasting_module.py
@@ -342,7 +342,16 @@ def epochs_trained(self):

class PLPastCovariatesModule(PLForecastingModule, ABC):
def _produce_train_output(self, input_batch: Tuple):
past_target, past_covariate = input_batch
"""
Feeds PastCovariatesTorchModel with input and output chunks of a PastCovariatesSequentialDataset for
training.

Parameters
----------
input_batch
``(past_target, past_covariates, static_covariates)``
"""
past_target, past_covariate, _ = input_batch
# Currently all our PastCovariates models require past target and covariates concatenated
inpt = (
torch.cat([past_target, past_covariate], dim=2)
@@ -363,13 +372,13 @@ def _get_batch_prediction(
n
prediction length
input_batch
(past_target, past_covariates, future_past_covariates)
``(past_target, past_covariates, future_past_covariates, static_covariates)``
roll_size
roll input arrays after every sequence by ``roll_size``. Initially, ``roll_size`` is equivalent to
``self.output_chunk_length``
"""
dim_component = 2
past_target, past_covariates, future_past_covariates = input_batch
past_target, past_covariates, future_past_covariates, _ = input_batch

n_targets = past_target.shape[dim_component]
n_past_covs = (
@@ -462,63 +471,56 @@ class PLMixedCovariatesModule(PLForecastingModule, ABC):
def _produce_train_output(
self, input_batch: Tuple
) -> Tuple[torch.Tensor, torch.Tensor]:
"""
Feeds MixedCovariatesTorchModel with input and output chunks of a MixedCovariatesSequentialDataset for
training.

Parameters
----------
input_batch
``(past_target, past_covariates, historic_future_covariates, future_covariates, static_covariates)``.
"""
return self(self._process_input_batch(input_batch))

def _process_input_batch(
self, input_batch
) -> Tuple[torch.Tensor, Optional[torch.Tensor]]:
) -> Tuple[torch.Tensor, Optional[torch.Tensor], Optional[torch.Tensor]]:
"""
Converts output of MixedCovariatesDataset (training dataset) into an input/past- and
output/future chunk.

Parameters
----------
input_batch
``(past_target, past_covariates, historic_future_covariates, future_covariates)``.
``(past_target, past_covariates, historic_future_covariates, future_covariates, static_covariates)``.

Returns
-------
tuple
``(x_past, x_future)`` the input/past and output/future chunks.
``(x_past, x_future, x_static)`` the input/past and output/future chunks.
"""

(
past_target,
past_covariates,
historic_future_covariates,
future_covariates,
static_covariates,
) = input_batch
dim_variable = 2

# TODO: implement static covariates
static_covariates = None

x_past = torch.cat(
[
tensor
for tensor in [
past_target,
past_covariates,
historic_future_covariates,
static_covariates,
]
if tensor is not None
],
dim=dim_variable,
)

x_future = None
if future_covariates is not None or static_covariates is not None:
x_future = torch.cat(
[
tensor
for tensor in [future_covariates, static_covariates]
if tensor is not None
],
dim=dim_variable,
)

return x_past, x_future
return x_past, future_covariates, static_covariates

def _get_batch_prediction(
self, n: int, input_batch: Tuple, roll_size: int
@@ -545,6 +547,7 @@ def _get_batch_prediction(
historic_future_covariates,
future_covariates,
future_past_covariates,
static_covariates,
) = input_batch

n_targets = past_target.shape[dim_component]
@@ -557,18 +560,19 @@
else 0
)

input_past, input_future = self._process_input_batch(
input_past, input_future, input_static = self._process_input_batch(
(
past_target,
past_covariates,
historic_future_covariates,
future_covariates[:, :roll_size, :]
if future_covariates is not None
else None,
static_covariates,
)
)

out = self._produce_predict_output(x=(input_past, input_future))[
out = self._produce_predict_output(x=(input_past, input_future, input_static))[
:, self.first_prediction_index :, :
]

@@ -636,9 +640,9 @@ def _get_batch_prediction(
input_future = future_covariates[:, left_future:right_future, :]

# take only last part of the output sequence where needed
out = self._produce_predict_output(x=(input_past, input_future))[
:, self.first_prediction_index :, :
]
out = self._produce_predict_output(
x=(input_past, input_future, input_static)
)[:, self.first_prediction_index :, :]

batch_prediction.append(out)
prediction_length += self.output_chunk_length
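The net effect of the changes in this file: past inputs are still concatenated along the variable dimension, but future and static covariates are now passed through as separate tensors instead of being folded into `x_past`/`x_future`. A standalone sketch with assumed shapes:

```python
# Standalone sketch of the new batch processing; shapes are assumptions
# consistent with the docstrings above: (n_samples, n_time_steps, n_variables).
import torch

def process_input_batch(past_target, past_covs, historic_future_covs,
                        future_covs, static_covs):
    dim_variable = 2
    x_past = torch.cat(
        [t for t in (past_target, past_covs, historic_future_covs)
         if t is not None],
        dim=dim_variable,
    )
    # future and static covariates are passed through untouched
    return x_past, future_covs, static_covs

x_past, x_future, x_static = process_input_batch(
    torch.rand(32, 24, 1),   # past_target
    torch.rand(32, 24, 2),   # past_covariates
    torch.rand(32, 24, 1),   # historic_future_covariates
    torch.rand(32, 12, 1),   # future_covariates
    torch.rand(32, 1, 3),    # static_covariates, constant over time
)
print(x_past.shape)  # torch.Size([32, 24, 4])
```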
4 changes: 2 additions & 2 deletions darts/models/forecasting/rnn_model.py
@@ -103,7 +103,7 @@ def forward(self, x, h=None):
return predictions, last_hidden_state

def _produce_train_output(self, input_batch: Tuple):
past_target, historic_future_covariates, future_covariates = input_batch
past_target, historic_future_covariates, future_covariates, _ = input_batch
# For the RNN we concatenate the past_target with the future_covariates
# (they have the same length because we enforce a Shift dataset for RNNs)
model_input = (
@@ -127,7 +127,7 @@ def _get_batch_prediction(
"""
This model is recurrent, so we have to write a specific way to obtain the time series forecasts of length n.
"""
past_target, historic_future_covariates, future_covariates = input_batch
past_target, historic_future_covariates, future_covariates, _ = input_batch

if historic_future_covariates is not None:
# RNNs need as inputs (target[t] and covariates[t+1]) so here we shift the covariates
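For reference, the alignment the RNN comment describes: the network consumes `target[t]` together with `covariates[t+1]`, which is why the shifted dataset makes both tensors the same length. A toy illustration with assumed shapes:

```python
# Toy illustration of the RNN input alignment; shapes are assumptions.
import torch

past_target = torch.rand(32, 24, 1)        # target values at time t
future_covariates = torch.rand(32, 24, 2)  # covariates already shifted to t+1
model_input = torch.cat([past_target, future_covariates], dim=2)
print(model_input.shape)  # torch.Size([32, 24, 3])
```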
41 changes: 17 additions & 24 deletions darts/models/forecasting/tft_model.py
@@ -31,7 +31,7 @@
logger = get_logger(__name__)

MixedCovariatesTrainTensorType = Tuple[
torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor
torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor
]


@@ -331,26 +331,25 @@ def get_attention_mask_future(
)
return mask

def forward(self, x: Tuple[torch.Tensor, Optional[torch.Tensor]]) -> torch.Tensor:
def forward(
self, x: Tuple[torch.Tensor, Optional[torch.Tensor], Optional[torch.Tensor]]
) -> torch.Tensor:
"""TFT model forward pass.

Parameters
----------
x
comes as tuple `(x_past, x_future)` where `x_past` is the input/past chunk and `x_future`
comes as tuple `(x_past, x_future, x_static)` where `x_past` is the input/past chunk and `x_future`
is the output/future chunk. Input dimensions are `(n_samples, n_time_steps, n_variables)`

Returns
-------
torch.Tensor
the output tensor
"""
x_cont_past, x_cont_future = x
x_cont_past, x_cont_future, x_static = x
dim_samples, dim_time, dim_variable = 0, 1, 2

# TODO: implement static covariates
static_covariates = None

batch_size = x_cont_past.shape[dim_samples]
encoder_length = self.input_chunk_length
decoder_length = self.output_chunk_length
@@ -411,27 +410,21 @@ def forward(self, x: Tuple[torch.Tensor, Optional[torch.Tensor]]) -> torch.Tensor:
}

# Embedding and variable selection
if static_covariates is not None:
# TODO: implement static covariates
# # static embeddings will be constant over entire batch
# static_embedding = {name: input_vectors[name][:, 0] for name in self.static_variables}
# static_embedding, static_covariate_var = self.static_covariates_vsn(static_embedding)
raise NotImplementedError("Static covariates have yet to be defined")
if self.static_variables:
static_embedding = {
name: x_static[:, 0, i].unsqueeze(-1)
for i, name in enumerate(self.static_variables)
}
static_embedding, static_covariate_var = self.static_covariates_vsn(
static_embedding
)
else:
static_embedding = torch.zeros(
(x_cont_past.shape[0], self.hidden_size),
dtype=x_cont_past.dtype,
device=self.device,
)

# # TODO: implement below when static covariates are supported
# # this is only to interpret the output
# static_covariate_var = torch.zeros(
# (x_cont_past.shape[0], 0),
# dtype=x_cont_past.dtype,
# device=x_cont_past.device,
# )

static_context_expanded = self.expand_static_context(
context=self.static_context_grn(static_embedding), time_steps=time_steps
)
@@ -751,7 +744,8 @@ def __init__(
def _create_model(self, train_sample: MixedCovariatesTrainTensorType) -> nn.Module:
"""
`train_sample` contains the following tensors:
(past_target, past_covariates, historic_future_covariates, future_covariates, future_target)
(past_target, past_covariates, historic_future_covariates, future_covariates, static_covariates,
future_target)

each tensor has shape (n_timesteps, n_variables)
- past/historic tensors have shape (input_chunk_length, n_variables)
@@ -771,6 +765,7 @@ def _create_model(self, train_sample: MixedCovariatesTrainTensorType) -> nn.Module:
past_covariate,
historic_future_covariate,
future_covariate,
static_covariates,
future_target,
) = train_sample

@@ -797,8 +792,6 @@ def _create_model(self, train_sample: MixedCovariatesTrainTensorType) -> nn.Module:
axis=1,
)

static_covariates = None # placeholder for future

self.output_dim = (
(future_target.shape[1], 1)
if self.likelihood is None
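The key addition in the TFT forward pass is the static-embedding step: static covariates are constant over time, so only time index 0 is read, and each variable becomes a `(batch, 1)` tensor keyed by name for the variable selection network. A standalone sketch (the VSN itself is omitted):

```python
# Sketch of the static-embedding dict construction from the hunk above;
# variable names and shapes are illustrative assumptions.
import torch

x_static = torch.rand(32, 12, 3)  # (batch, time, n_static_variables)
static_variables = ["store_id", "region", "sku"]

static_embedding = {
    name: x_static[:, 0, i].unsqueeze(-1)  # (batch, 1); static, so t=0 suffices
    for i, name in enumerate(static_variables)
}
print({k: v.shape for k, v in static_embedding.items()})
```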
16 changes: 12 additions & 4 deletions darts/models/forecasting/tft_submodels.py
@@ -20,7 +20,7 @@
'
"""

from typing import Dict, List, Tuple, Union
from typing import Dict, List, Optional, Tuple, Union

import torch
import torch.nn as nn
@@ -378,17 +378,25 @@ def __init__(
self,
input_sizes: Dict[str, int],
hidden_size: int,
input_embedding_flags: Dict[str, bool] = {},
input_embedding_flags: Optional[Dict[str, bool]] = None,
dropout: float = 0.1,
context_size: int = None,
single_variable_grns: Dict[str, _GatedResidualNetwork] = {},
prescalers: Dict[str, nn.Linear] = {},
single_variable_grns: Optional[Dict[str, _GatedResidualNetwork]] = None,
prescalers: Optional[Dict[str, nn.Linear]] = None,
):
"""
Calculate weights for ``num_inputs`` variables which are each of size ``input_size``
"""
super().__init__()

input_embedding_flags = (
input_embedding_flags if input_embedding_flags is not None else {}
)
single_variable_grns = (
single_variable_grns if single_variable_grns is not None else {}
)
prescalers = prescalers if prescalers is not None else {}

self.hidden_size = hidden_size
self.input_sizes = input_sizes
self.input_embedding_flags = input_embedding_flags
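The signature change above replaces mutable default arguments (`{}`) with `None` plus an in-body fallback. That matters because a mutable default is created once at definition time and shared across all calls; a toy demonstration unrelated to darts itself:

```python
# Why the Optional[...] = None idiom is used above: toy demonstration of the
# mutable-default-argument pitfall.
def bad(flags={}):
    flags["calls"] = flags.get("calls", 0) + 1
    return flags

def good(flags=None):
    flags = flags if flags is not None else {}
    flags["calls"] = flags.get("calls", 0) + 1
    return flags

print(bad())   # {'calls': 1}
print(bad())   # {'calls': 2}  <- state leaked from the previous call
print(good())  # {'calls': 1}
print(good())  # {'calls': 1}  <- fresh dict every call
```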