In [1]:
import os
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import lightgbm as lgb
from statsmodels.tsa.stattools import adfuller
from sktime.forecasting.model_selection import temporal_train_test_split
from sktime.transformations.series.summarize import WindowSummarizer
from sktime.forecasting.compose import make_reduction
from sklearn.model_selection import GridSearchCV, TimeSeriesSplit
from sklearn.pipeline import Pipeline
from sklearn.metrics import mean_squared_error

Dask dataframe query planning is disabled because dask-expr is not installed.

You can install it with `pip install dask[dataframe]` or `conda install dask`.
This will raise in a future version.



In [2]:
data = pd.read_csv("../data/HMIS_DATA_CORRECTED_17_21/mh_dist17_21_with_IDs_date_correction.csv")
data = data[(data['indicator_type'] == 'Total [(A+B) or (C+D)]')]
data['date'] = pd.to_datetime(data['date'])
data = data.set_index('date')
data.index = pd.DatetimeIndex(data.index)

In [3]:
def lightgbm_forecast_lags(series, district_name, 
                          max_lags=6, 
                          window_features=None,
                          differencing=True,
                          use_cv=True,
                          custom_params=None):
    """
    LightGBM time series forecasting with proper temporal validation
    """
    # Create output directory
    os.makedirs('LightGBM_Forecasts', exist_ok=True)
    
    # 1. Stationarity handling
    original_series = series.copy()
    d = 0
    if differencing:
        adf_result = adfuller(series.dropna())
        if adf_result[1] > 0.05:
            d = 1
            series = series.diff().dropna()

    # 2. Temporal split using sktime's proper method
    y_train, y_test = temporal_train_test_split(series, test_size=0.2)

    # 3. Create feature engineering pipeline
    features = []
    if max_lags > 0:
        features.append(("lags", WindowSummarizer(
            lag_feature={"lag": list(range(1, max_lags+1))},
            truncate="bfill"
        )))
    
    if window_features:
        features.append(("window", WindowSummarizer(
            lag_feature={
                "mean": [[1, window_features['mean_window']]],
                "std": [[1, window_features['std_window']]]
            },
            truncate="bfill"
        )))

    # 4. LightGBM regressor setup
    regressor = lgb.LGBMRegressor(
        **custom_params or {
            'objective': 'regression',
            'metric': 'rmse',
            'num_leaves': 31,
            'learning_rate': 0.05,
            'n_estimators': 500,
            'random_state': 42
        }
    )
    
    # 5. Create forecasting pipeline
    forecaster = make_reduction(
        estimator=Pipeline([
            ("features", Pipeline(features)),
            ("regressor", regressor)
        ]),
        window_length=max_lags,
        strategy="recursive"
    )

    # 6. Hyperparameter tuning with temporal CV
    if use_cv:
        param_grid = {
            'estimator__regressor__num_leaves': [15, 31, 63],
            'estimator__regressor__learning_rate': [0.01, 0.05, 0.1],
            'estimator__regressor__min_child_samples': [10, 20, 50]
        }
        
        forecaster = GridSearchCV(
            forecaster,
            param_grid,
            cv=TimeSeriesSplit(n_splits=5),
            scoring='neg_mean_squared_error',
            n_jobs=-1
        )

    # 7. Training
    forecaster.fit(y_train)
    
    # 8. Forecasting
    fh = np.arange(len(y_test)) + 1  # Forecast horizon
    y_pred = forecaster.predict(fh)
    
    # 9. Inverse differencing
    if d == 1:
        last_train_value = original_series.iloc[-len(y_test)-1]
        y_pred = pd.Series(np.cumsum(y_pred) + last_train_value, index=y_test.index)
        y_test = original_series.iloc[-len(y_test):]

    # 10. Create results dataframe
    forecast_df = pd.DataFrame({
        'district': district_name,
        'date': y_test.index,
        'actual': y_test.values,
        'forecast': y_pred.values
    })

    # 11. Save results
    forecast_df.to_csv(
        f'LightGBM_Forecasts/{district_name}_forecast.csv',
        index=False
    )

    # 12. Calculate metrics
    rmse = np.sqrt(mean_squared_error(y_test, y_pred))
    metrics = {
        'district': district_name,
        'rmse': rmse,
        'best_params': getattr(forecaster, 'best_params_', None),
        'differencing': d
    }

    # 13. Visualization
    plt.figure(figsize=(14, 7))
    plt.plot(original_series.index, original_series, label='Original')
    plt.plot(forecast_df['date'], forecast_df['forecast'], 
            label='LightGBM Forecast', alpha=0.7)
    plt.title(f'{district_name} Forecast\nRMSE: {rmse:.2f}')
    plt.legend()
    plt.savefig(f'LightGBM_Forecasts/{district_name}_forecast_plot.png')
    plt.close()

    return metrics, forecast_df

In [4]:
districts = data['district'].unique()
rmse_values = []

# Usage Example


def run_for_each_district():
    results = {}
    
    for district in districts:
        district_data = data[data['district'] == district]
        ts = district_data["I8"].asfreq('MS')
        
        results, forecast = lightgbm_forecast_lags(
        series=ts,
        district_name=district,
        max_lags=6,
        window_features={'mean_window': 3, 'std_window': 6},
        custom_params={
            'num_leaves': 63,
            'learning_rate': 0.1,
            'n_estimators': 1000
        }
    )

        
    
        # Show results
        print("=== Metrics ===")
        print(results)
        print("\n=== Forecast Data ===")
        print(forecast)
    
    return results
run_for_each_district()

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000089 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 137
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 130.645161
=== Metrics ===
{'district': 'AHMEDNAGAR', 'rmse': 1891.102136102216, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
     district       date  actual     forecast
0  AHMEDNAGAR 2020-06-01    6372  7561.311518
1  AHMEDNAGAR 2020-07-01    5982  7477.171827
2  AHMEDNAGAR 2020-08-01    5559  7527.606727
3  AHMEDNAGAR 2020-09-01    5903  7849.690512
4  AHMEDNAGAR 2020-10-01    5719  7580.421046
5  AHMEDNAGAR 2020-11-01    5427  8040.702833
6  AHMEDNAGAR

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000281 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 136
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 22.741935
=== Metrics ===
{'district': 'AKOLA', 'rmse': 390.7629421620926, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0    AKOLA 2020-06-01    1575  1582.924882
1    AKOLA 2020-07-01    1555  1673.179839
2    AKOLA 2020-08-01    1523  1785.295007
3    AKOLA 2020-09-01    1606  1872.979681
4    AKOLA 2020-10-01    1395  1852.000782
5    AKOLA 2020-11-01    1204  1956.272621
6    AKOLA 2020-12-01    1630  1862.157986
7    AKOLA 2021-01-01    1745  2028.446317
8    AKOLA 2021-02

 nan nan nan nan nan nan nan nan nan]


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000232 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 140
[LightGBM] [Info] Number of data points in the train set: 32, number of used features: 12
[LightGBM] [Info] Start training from score 2161.968750
=== Metrics ===
{'district': 'AMRAVATI', 'rmse': 417.97253265393636, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 0}

=== Forecast Data ===
   district       date  actual     forecast
0  AMRAVATI 2020-06-01    2017  2390.798282
1  AMRAVATI 2020-07-01    1905  2390.798282
2  AMRAVATI 2020-08-01    1776  2390.798282
3  AMRAVATI 2020-09-01    1794  2390.798282
4  AMRAVATI 2020-10-01    1814  2390.798282
5  AMRAVATI 2020-11-01    1896  2390.798282
6  AMRAVATI 2020-12-01    2379  2390.798282
7  AMRAVATI 2021-01-01    2249  2390.798282
8  

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000223 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 136
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 25.000000
=== Metrics ===
{'district': 'AURANGABAD', 'rmse': 895.1845486507957, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
     district       date  actual     forecast
0  AURANGABAD 2020-06-01    3456  3608.953492
1  AURANGABAD 2020-07-01    2897  3652.838648
2  AURANGABAD 2020-08-01    3107  3786.904338
3  AURANGABAD 2020-09-01    3639  3776.630729
4  AURANGABAD 2020-10-01    5000  3849.777135
5  AURANGABAD 2020-11-01    4498  3890.028980
6  AURANGABAD 2020-12-01    5448  3946.458423
7  AURANGABAD 2021-01-01    5221

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000077 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 134
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 51.290323
=== Metrics ===
{'district': 'BEED', 'rmse': 743.6097200754442, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0     BEED 2020-06-01    3448  3812.492359
1     BEED 2020-07-01    3407  3992.723217
2     BEED 2020-08-01    2907  4061.523713
3     BEED 2020-09-01    3136  4019.115390
4     BEED 2020-10-01    3117  4025.815516
5     BEED 2020-11-01    2842  3998.582664
6     BEED 2020-12-01    3110  3782.532955
7     BEED 2021-01-01    3208  3741.563465
8     BEED 2021-02-

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000222 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 137
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 13.741935
=== Metrics ===
{'district': 'BHANDARA', 'rmse': 169.75854930616416, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
   district       date  actual     forecast
0  BHANDARA 2020-06-01    1228  1324.822055
1  BHANDARA 2020-07-01    1165  1290.690022
2  BHANDARA 2020-08-01    1101  1264.509939
3  BHANDARA 2020-09-01    1151  1292.552934
4  BHANDARA 2020-10-01    1152  1292.820342
5  BHANDARA 2020-11-01    1031  1321.002737
6  BHANDARA 2020-12-01    127

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000126 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 135
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 29.451613
=== Metrics ===
{'district': 'BULDHANA', 'rmse': 245.4024662203009, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
   district       date  actual     forecast
0  BULDHANA 2020-06-01    1522  1335.125669
1  BULDHANA 2020-07-01    1439  1337.128851
2  BULDHANA 2020-08-01    1345  1484.036142
3  BULDHANA 2020-09-01    1602  1344.639599
4  BULDHANA 2020-10-01    1459  1559.126923
5  BULDHANA 2020-11-01    1389  1364.136757
6  BULDHANA 2020-12-01    1711  1413.288437
7  BULDHANA 2021-01-01    1734  1607.846025
8  BUL

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 0.000242 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 133
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 35.000000
=== Metrics ===
{'district': 'CHANDRAPUR', 'rmse': 538.3196728761411, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
     district       date  actual     forecast
0  CHANDRAPUR 2020-06-01    2334  2719.693471
1  CHANDRAPUR 2020-07-01    2279  2874.925465
2  CHANDRAPUR 2020-08-01    2103  2679.489959
3  CHANDRAPUR 2020-09-01    2030  2701.246150
4  CHANDRAPUR 2020-10-01    2073  2687.307859
5  CHANDRAPUR 2020-11-01    1897  2719.611344
6  CHANDRAPUR 

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000672 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 134
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 69.096774
=== Metrics ===
{'district': 'DHULE', 'rmse': 547.0043266047629, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0    DHULE 2020-06-01    3508  3455.491371
1    DHULE 2020-07-01    3317  3624.248373
2    DHULE 2020-08-01    2764  3858.943027
3    DHULE 2020-09-01    3344  4009.338926
4    DHULE 2020-10-01    3020  3693.432676
5    DHULE 2020-11-01    2908  3389.586392
6    DHULE 2020-12-01    3477  4068.480716
7    DHULE 2021-01-01    3554  4001.558449
8    DHULE 2021-02

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000428 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 138
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 22.806452
=== Metrics ===
{'district': 'GADCHIROLI', 'rmse': 436.3122950181828, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
     district       date  actual     forecast
0  GADCHIROLI 2020-06-01    1665  1801.116206
1  GADCHIROLI 2020-07-01    1437  1739.816725
2  GADCHIROLI 2020-08-01    1218  1595.810861
3  GADCHIROLI 2020-09-01    1327  1699.322583
4  GADCHIROLI 2020-10-01    1197  1779.289002
5  GADCHIROLI 2020-11-01    1211  1756.367893
6  GADCHIROLI 2020-12-01    1363  1850.090692
7  GADCHIROLI 2021-01-01    1302

 nan nan nan nan nan nan nan nan nan]


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000334 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 137
[LightGBM] [Info] Number of data points in the train set: 32, number of used features: 12
[LightGBM] [Info] Start training from score 1408.656250
=== Metrics ===
{'district': 'GONDIA', 'rmse': 224.84802675278357, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 0}

=== Forecast Data ===
  district       date  actual     forecast
0   GONDIA 2020-06-01    1556  1441.992675
1   GONDIA 2020-07-01    1454  1667.735732
2   GONDIA 2020-08-01    1331  1667.735732
3   GONDIA 2020-09-01    1309  1608.368008
4   GONDIA 2020-10-01    1341  1587.389937
5   GONDIA 2020-11-01    1444  1587.389937
6   GONDIA 2020-12-01    1405  1669.467748
7   GONDIA 2021-01-01    1340  1587.389937
8   GONDIA 202

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000362 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 135
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 29.741935
=== Metrics ===
{'district': 'HINGOLI', 'rmse': 129.50983085407404, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0  HINGOLI 2020-06-01    1667  1779.620047
1  HINGOLI 2020-07-01    1514  1829.245534
2  HINGOLI 2020-08-01    1569  1661.763304
3  HINGOLI 2020-09-01    1745  1715.950375
4  HINGOLI 2020-10-01    1749  1687.137954
5  HINGOLI 2020-11-01    1616  1707.453584
6  HINGOLI 2020-12-01    1687  1854.179927
7  HINGOLI 2021-01-01    1732  1724.562733
8  HINGOLI 2021

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000175 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 135
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 86.580645
=== Metrics ===
{'district': 'JALGAON', 'rmse': 1556.6694401004768, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0  JALGAON 2020-06-01    5556  5614.077533
1  JALGAON 2020-07-01    4641  5878.480336
2  JALGAON 2020-08-01    4335  6232.810720
3  JALGAON 2020-09-01    4806  6454.095017
4  JALGAON 2020-10-01    4731  6284.648117
5  JALGAON 2020-11-01    4652  6638.978500
6  JALGAON 2020-12-01    5392  6996.971946
7  JALGAON 2021-01-01    5235  6918.213068
8  JALGAON 2021

 nan nan nan nan nan nan nan nan nan]


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000292 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 134
[LightGBM] [Info] Number of data points in the train set: 32, number of used features: 12
[LightGBM] [Info] Start training from score 1663.281250
=== Metrics ===
{'district': 'JALNA', 'rmse': 225.01111550570872, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 0}

=== Forecast Data ===
  district       date  actual     forecast
0    JALNA 2020-06-01    1935  1762.437506
1    JALNA 2020-07-01    2128  1762.437506
2    JALNA 2020-08-01    1604  1762.437506
3    JALNA 2020-09-01    1731  1762.437506
4    JALNA 2020-10-01    1698  1762.437506
5    JALNA 2020-11-01    1869  1762.437506
6    JALNA 2020-12-01    2109  1762.437506
7    JALNA 2021-01-01    2118  1762.437506
8    JALNA 2021

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000249 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 137
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 50.645161
=== Metrics ===
{'district': 'KOLHAPUR', 'rmse': 407.79454340238385, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
   district       date  actual     forecast
0  KOLHAPUR 2020-06-01    3692  3815.047287
1  KOLHAPUR 2020-07-01    3357  3759.029977
2  KOLHAPUR 2020-08-01    3163  3985.343696
3  KOLHAPUR 2020-09-01    3576  3935.478233
4  KOLHAPUR 2020-10-01    3711  3940.816938
5  KOLHAPUR 2020-11-01    3480  4165.512923
6  KOLHAPUR 2020-12-01    4336  4030.584734
7  KOLHAPUR 2021-01-01    4042  4112.986635
8  KO

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000206 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 136
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 70.774194
=== Metrics ===
{'district': 'LATUR', 'rmse': 492.8846785692674, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0    LATUR 2020-06-01    3784  3862.204204
1    LATUR 2020-07-01    3500  3926.116553
2    LATUR 2020-08-01    3274  3779.002330
3    LATUR 2020-09-01    3634  4141.507700
4    LATUR 2020-10-01    3408  4007.894706
5    LATUR 2020-11-01    3363  4122.107013
6    LATUR 2020-12-01    3601  4052.088921
7    LATUR 2021-01-01    3699  4056.024891
8    LATUR 2021-02

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000283 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 136
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score -140.548387
=== Metrics ===
{'district': 'MUMBAI', 'rmse': 6963.11117199351, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0   MUMBAI 2020-06-01    1485  -988.050694
1   MUMBAI 2020-07-01    1525  -824.096190
2   MUMBAI 2020-08-01    1497 -2635.944621
3   MUMBAI 2020-09-01    1472 -3420.612506
4   MUMBAI 2020-10-01    1756 -5319.415694
5   MUMBAI 2020-11-01    2196 -3909.882370
6   MUMBAI 2020-12-01    2738 -5848.933064
7   MUMBAI 2021-01-01    2397 -5684.978560
8   MUMBAI 2021-

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000535 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 135
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 53.225806
=== Metrics ===
{'district': 'NAGPUR', 'rmse': 932.0572047893311, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0   NAGPUR 2020-06-01    5763  5097.345774
1   NAGPUR 2020-07-01    5816  5032.340920
2   NAGPUR 2020-08-01    4461  5893.264171
3   NAGPUR 2020-09-01    4485  5731.636867
4   NAGPUR 2020-10-01    4837  5768.246075
5   NAGPUR 2020-11-01    5721  5833.592814
6   NAGPUR 2020-12-01    6553  5775.382016
7   NAGPUR 2021-01-01    6620  6319.213043
8   NAGPUR 2021-0

 nan nan nan nan nan nan nan nan nan]


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000159 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 137
[LightGBM] [Info] Number of data points in the train set: 32, number of used features: 12
[LightGBM] [Info] Start training from score 4390.562500
=== Metrics ===
{'district': 'NANDED', 'rmse': 302.4556472104022, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 0}

=== Forecast Data ===
  district       date  actual     forecast
0   NANDED 2020-06-01    4882  4766.144519
1   NANDED 2020-07-01    4668  4558.023988
2   NANDED 2020-08-01    4358  4558.023988
3   NANDED 2020-09-01    5176  4558.023988
4   NANDED 2020-10-01    4553  4558.023988
5   NANDED 2020-11-01    4475  4622.540152
6   NANDED 2020-12-01    4906  4558.023988
7   NANDED 2021-01-01    5001  4766.144519
8   NANDED 2021

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000189 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 138
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 65.516129
=== Metrics ===
{'district': 'NANDURBAR', 'rmse': 1300.812304371049, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
    district       date  actual     forecast
0  NANDURBAR 2020-06-01    3463  3531.139798
1  NANDURBAR 2020-07-01    3193  3836.546761
2  NANDURBAR 2020-08-01    2585  3734.730023
3  NANDURBAR 2020-09-01    2762  4058.219216
4  NANDURBAR 2020-10-01    2322  3868.145454
5  NANDURBAR 2020-11-01    2311  4191.634648
6  NANDURBAR 2020-12-01    2661  3857.120627
7  NANDURBAR 2021-01-01    2528  4248.325

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000359 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 137
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 127.000000
=== Metrics ===
{'district': 'NASHIK', 'rmse': 482.14604415317405, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0   NASHIK 2020-06-01    6593  6746.636849
1   NASHIK 2020-07-01    6411  6951.896748
2   NASHIK 2020-08-01    6147  6989.588482
3   NASHIK 2020-09-01    6180  7025.735617
4   NASHIK 2020-10-01    6938  6974.733412
5   NASHIK 2020-11-01    7314  6910.872088
6   NASHIK 2020-12-01    7560  7353.082625
7   NASHIK 2021-01-01    7807  7814.126897
8   NASHIK 2021

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000287 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 137
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 33.290323
=== Metrics ===
{'district': 'OSMANABAD', 'rmse': 340.3749612397408, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
    district       date  actual     forecast
0  OSMANABAD 2020-06-01    1977  2227.982714
1  OSMANABAD 2020-07-01    1856  2180.919998
2  OSMANABAD 2020-08-01    1675  2227.523058
3  OSMANABAD 2020-09-01    1793  2348.312243
4  OSMANABAD 2020-10-01    1701  2122.552145
5  OSMANABAD 2020-11-01    1857  2104.870134
6  OSMANABAD 2020-12-01    2177  2202.343951
7  OSMANABAD 2021-01-01    2344  2437.917

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000173 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 138
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 32.516129
=== Metrics ===
{'district': 'PALGHAR', 'rmse': 599.1783115017296, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0  PALGHAR 2020-06-01    3663  3962.343823
1  PALGHAR 2020-07-01    3371  3870.552469
2  PALGHAR 2020-08-01    3171  3797.050142
3  PALGHAR 2020-09-01    3269  4018.371640
4  PALGHAR 2020-10-01    3271  4191.715463
5  PALGHAR 2020-11-01    3189  4070.235460
6  PALGHAR 2020-12-01    3657  3996.733133
7  PALGHAR 2021-01-01    3513  4116.468047
8  PALGHAR 2021-

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000243 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 137
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 18.483871
=== Metrics ===
{'district': 'PARBHANI', 'rmse': 156.2212721629605, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
   district       date  actual     forecast
0  PARBHANI 2020-06-01    1546  1521.987571
1  PARBHANI 2020-07-01    1441  1437.188650
2  PARBHANI 2020-08-01    1144  1321.965987
3  PARBHANI 2020-09-01    1478  1394.741074
4  PARBHANI 2020-10-01    1580  1380.601264
5  PARBHANI 2020-11-01    1311  1510.460287
6  PARBHANI 2020-12-01    1730  1425.661366
7  PARBHANI 2021-01-01    1473  1474.410000
8  PAR

 nan nan nan nan nan nan nan nan nan]


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000312 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 136
[LightGBM] [Info] Number of data points in the train set: 32, number of used features: 12
[LightGBM] [Info] Start training from score 6821.031250
=== Metrics ===
{'district': 'PUNE', 'rmse': 1063.1931967118298, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 0}

=== Forecast Data ===
  district       date  actual     forecast
0     PUNE 2020-06-01    6054  6165.487472
1     PUNE 2020-07-01    5520  6242.399726
2     PUNE 2020-08-01    5630  6359.206225
3     PUNE 2020-09-01    5491  7432.809974
4     PUNE 2020-10-01    6135  7786.121743
5     PUNE 2020-11-01    6162  7268.052845
6     PUNE 2020-12-01    7696  7161.147154
7     PUNE 2021-01-01    7485  7042.806122
8     PUNE 2021-

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000189 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 138
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 18.516129
=== Metrics ===
{'district': 'RAIGAD', 'rmse': 862.2707732833808, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0   RAIGAD 2020-06-01    1582  1839.262239
1   RAIGAD 2020-07-01    1563  1693.041614
2   RAIGAD 2020-08-01    1516  1914.990646
3   RAIGAD 2020-09-01    1568  1968.571252
4   RAIGAD 2020-10-01    1569  1796.417096
5   RAIGAD 2020-11-01    2801  2300.501768
6   RAIGAD 2020-12-01    3265  2149.222365
7   RAIGAD 2021-01-01    3701  2174.167865
8   RAIGAD 2021-0

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000270 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 133
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 8.161290
=== Metrics ===
{'district': 'RATNAGIRI', 'rmse': 124.13697554938376, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
    district       date  actual    forecast
0  RATNAGIRI 2020-06-01     848  671.298306
1  RATNAGIRI 2020-07-01     772  742.857089
2  RATNAGIRI 2020-08-01     803  657.155955
3  RATNAGIRI 2020-09-01     545  747.375168
4  RATNAGIRI 2020-10-01     679  659.907681
5  RATNAGIRI 2020-11-01     551  765.421066
6  RATNAGIRI 2020-12-01     665  677.953579
7  RATNAGIRI 2021-01-01     683  783.466964
8  RA

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000310 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 134
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 20.225806
=== Metrics ===
{'district': 'SANGLI', 'rmse': 160.46560541494384, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0   SANGLI 2020-06-01    1724  1620.454755
1   SANGLI 2020-07-01    1914  1780.792962
2   SANGLI 2020-08-01    1544  1659.858301
3   SANGLI 2020-09-01    1534  1678.408252
4   SANGLI 2020-10-01    1492  1805.814330
5   SANGLI 2020-11-01    1581  1658.976551
6   SANGLI 2020-12-01    1633  1623.777214
7   SANGLI 2021-01-01    1529  1751.183292
8   SANGLI 2021-

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000234 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 133
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 7.516129
=== Metrics ===
{'district': 'SATARA', 'rmse': 2095.2165151787863, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0   SATARA 2020-06-01    2237  1999.990414
1   SATARA 2020-07-01    2118  2092.482131
2   SATARA 2020-08-01    1561  2115.016698
3   SATARA 2020-09-01    1380  2075.083641
4   SATARA 2020-10-01    1570  2041.146972
5   SATARA 2020-11-01    1571  2067.436531
6   SATARA 2020-12-01    2220  2156.127428
7   SATARA 2021-01-01    2617  2184.592097
8   SATARA 2021-0

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000221 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 134
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 6.258065
=== Metrics ===
{'district': 'SINDHUDURG', 'rmse': 68.83356813529052, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
     district       date  actual    forecast
0  SINDHUDURG 2020-06-01     420  405.750668
1  SINDHUDURG 2020-07-01     500  456.006873
2  SINDHUDURG 2020-08-01     376  441.400808
3  SINDHUDURG 2020-09-01     367  390.064275
4  SINDHUDURG 2020-10-01     361  379.178721
5  SINDHUDURG 2020-11-01     322  413.580684
6  SINDHUDURG 2020-12-01     359  396.803723
7  SINDHUDURG 2021-01-01     462  367.551

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000249 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 136
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 84.419355
=== Metrics ===
{'district': 'SOLAPUR', 'rmse': 778.4293439263108, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0  SOLAPUR 2020-06-01    4094  4750.905946
1  SOLAPUR 2020-07-01    3821  4733.149231
2  SOLAPUR 2020-08-01    3842  4578.235237
3  SOLAPUR 2020-09-01    4147  5067.931021
4  SOLAPUR 2020-10-01    3847  4856.287586
5  SOLAPUR 2020-11-01    3885  5312.625053
6  SOLAPUR 2020-12-01    5349  5343.973238
7  SOLAPUR 2021-01-01    4991  4997.262912
8  SOLAPUR 2021-

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000273 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 134
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 99.741935
=== Metrics ===
{'district': 'THANE', 'rmse': 1097.2292708742393, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual      forecast
0    THANE 2020-06-01   10413   8617.008393
1    THANE 2020-07-01    9367   9011.295490
2    THANE 2020-08-01    9815   8891.637580
3    THANE 2020-09-01    9676   8958.715384
4    THANE 2020-10-01    9483   9926.621577
5    THANE 2020-11-01   10375   9997.212973
6    THANE 2020-12-01   11389  10109.429249
7    THANE 2021-01-01   11881  10278.939922
8    THA

 nan nan nan nan nan nan nan nan nan]


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000299 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 136
[LightGBM] [Info] Number of data points in the train set: 32, number of used features: 12
[LightGBM] [Info] Start training from score 1402.968750
=== Metrics ===
{'district': 'WARDHA', 'rmse': 213.09806354559623, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 0}

=== Forecast Data ===
  district       date  actual     forecast
0   WARDHA 2020-06-01    1271  1403.201618
1   WARDHA 2020-07-01    1258  1470.632234
2   WARDHA 2020-08-01    1219  1405.185174
3   WARDHA 2020-09-01    1186  1432.782946
4   WARDHA 2020-10-01    1151  1360.775245
5   WARDHA 2020-11-01    1033  1492.272375
6   WARDHA 2020-12-01    1337  1523.638640
7   WARDHA 2021-01-01    1369  1351.890163
8   WARDHA 202

27 fits failed out of a total of 135.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\P

[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000351 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 137
[LightGBM] [Info] Number of data points in the train set: 31, number of used features: 12
[LightGBM] [Info] Start training from score 17.548387
=== Metrics ===
{'district': 'WASHIM', 'rmse': 169.63376947277234, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 1}

=== Forecast Data ===
  district       date  actual     forecast
0   WASHIM 2020-06-01    1316  1439.826398
1   WASHIM 2020-07-01    1320  1490.293450
2   WASHIM 2020-08-01    1354  1462.131104
3   WASHIM 2020-09-01    1281  1621.510079
4   WASHIM 2020-10-01    1304  1499.822737
5   WASHIM 2020-11-01    1237  1453.962813
6   WASHIM 2020-12-01    1499  1469.037664
7   WASHIM 2021-01-01    1392  1513.406725
8   WASHIM 2021-

 nan nan nan nan nan nan nan nan nan]


[LightGBM] [Info] Auto-choosing col-wise multi-threading, the overhead of testing was 0.000212 seconds.
You can set `force_col_wise=true` to remove the overhead.
[LightGBM] [Info] Total Bins 137
[LightGBM] [Info] Number of data points in the train set: 32, number of used features: 12
[LightGBM] [Info] Start training from score 2961.812500
=== Metrics ===
{'district': 'YAVATMAL', 'rmse': 376.22293699116557, 'best_params': {'estimator__regressor__learning_rate': 0.01, 'estimator__regressor__min_child_samples': 10, 'estimator__regressor__num_leaves': 15}, 'differencing': 0}

=== Forecast Data ===
   district       date  actual     forecast
0  YAVATMAL 2020-06-01    3011  2635.153615
1  YAVATMAL 2020-07-01    3187  2689.589064
2  YAVATMAL 2020-08-01    2613  2804.205895
3  YAVATMAL 2020-09-01    2629  2657.095183
4  YAVATMAL 2020-10-01    2797  2810.503102
5  YAVATMAL 2020-11-01    2682  2800.857796
6  YAVATMAL 2020-12-01    3140  2883.395480
7  YAVATMAL 2021-01-01    3105  2883.395480
8  

ValueError: 
All the 135 fits failed.
It is very likely that your model is misconfigured.
You can try to debug the error by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
108 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 963, in _fit
    yt, Xt = self._transform(y, X)
             ^^^^^^^^^^^^^^^^^^^^^
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 870, in _transform
    return _sliding_window_transform(
           ^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 139, in _sliding_window_transform
    yt, Xt = _sliding_window_trans_f(y=y, X=X, window_length=window_length, **kwargs)
             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 161, in _sliding_window_transform_local
    raise ValueError(
ValueError: The `window_length` and `fh` are incompatible with the length of `y`

--------------------------------------------------------------------------------
27 fits failed with the following error:
Traceback (most recent call last):
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\model_selection\_validation.py", line 893, in _fit_and_score
    estimator.fit(X_train, **fit_params)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\base\_base.py", line 396, in fit
    self._fit(y=y_inner, X=X_inner, fh=fh)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sktime\forecasting\compose\_reduce.py", line 972, in _fit
    self.estimator_.fit(Xt, yt)
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\base.py", line 1474, in wrapper
    return fit_method(estimator, *args, **kwargs)
           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\pipeline.py", line 475, in fit
    self._final_estimator.fit(Xt, y, **last_step_params["fit"])
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\lightgbm\sklearn.py", line 1398, in fit
    super().fit(
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\lightgbm\sklearn.py", line 949, in fit
    _X, _y = _LGBMValidateData(
             ^^^^^^^^^^^^^^^^^^
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\lightgbm\compat.py", line 78, in validate_data
    X, y = check_X_y(
           ^^^^^^^^^^
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\utils\validation.py", line 1263, in check_X_y
    X = check_array(
        ^^^^^^^^^^^^
  File "c:\Users\nauti\AppData\Local\Programs\Python\Python311\Lib\site-packages\sklearn\utils\validation.py", line 1072, in check_array
    raise ValueError(
ValueError: Found array with 1 sample(s) (shape=(1, 12)) while a minimum of 2 is required.


In [None]:
# !pip install "dask<2025.1"
