In [2]:
import pandas as pd

from timeseries_module.main import main
from timeseries_module.missing_values.methods import (
    fill_forward, fill_backward, linear_interpolation, window_mean
)
from timeseries_module.outliers.methods import (
    remove_outliers_zscore, remove_outliers_iqr, remove_outliers_lof, remove_outliers_linear_regression
)
from timeseries_module.rolling.methods import (
    rolling_mean, rolling_max, rolling_median, rolling_min, rolling_quantile, rolling_std, rolling_sum, rolling_var
)



In [2]:
# Load the raw 4-thread capture. It gets its own descriptive name because a
# later cell binds `df` to an unrelated temperature dataset.
cpu_raw = pd.read_csv('data/4threads.csv')

# Run the timeseries_module pipeline on the CPU-utilisation column, using the
# z-score outlier function at "high" sensitivity and a rolling mean with
# window=15.
# NOTE(review): export=True presumably writes results under `output_path` --
# confirm against timeseries_module.main.
clean = main(
    input_df=cpu_raw,
    output_path="output/4threads",
    outlier_sensitivity_degree="high",
    value_column="cpu_utilization_percent",
    missing_value_function=None,  # no missing-value function is supplied
    outlier_fn=remove_outliers_zscore,
    time_column="time",
    rolling_fn=rolling_mean,
    rolling_kwargs={"window": 15},
    export=True,
)

# A bare last expression uses the notebook's rich DataFrame display, so the
# columns are not wrapped across lines the way print() output is.
clean.head()

                  time  ram_usage_GB  ram_utilization_percent  \
0  2025-08-17_21-45-25      7.876648                     49.5   
1  2025-08-17_21-45-26      7.578224                     47.6   
2  2025-08-17_21-45-27      7.842964                     49.3   
3  2025-08-17_21-45-28      7.843349                     49.3   
4  2025-08-17_21-45-29      7.816677                     49.1   

   cpu_utilization_percent  
0                     43.7  
1                     80.3  
2                     71.3  
3                     75.8  
4                     67.7  


In [3]:
# Load the temperature series. The name `df` is kept because the following
# rolling-std cell reads this same frame.
df = pd.read_csv('data/temperature_2014_18.csv')

# Run the pipeline on the "Temperature" column with no missing-value function
# and no outlier function; only a rolling mean (window=750) is requested.
# NOTE(review): export=True presumably writes results under `output_path` --
# confirm against timeseries_module.main.
temp_mean = main(
    input_df=df,
    output_path="output/temperature_2014_18_mean_750",
    outlier_sensitivity_degree=None,
    value_column="Temperature",
    missing_value_function=None,
    outlier_fn=None,
    time_column="datetime",
    rolling_fn=rolling_mean,
    rolling_kwargs={"window": 750},
    export=True,
)

# Bare last expression -> rich DataFrame display instead of print() text.
temp_mean.head()

   Unnamed: 0             datetime  Temperature
0           0  2014-01-01 06:00:00         9.44
1           1  2014-01-01 07:00:00        11.87
2           2  2014-01-01 08:00:00        14.55
3           3  2014-01-01 09:00:00        17.81
4           4  2014-01-01 10:00:00        21.96


In [4]:
# Rolling standard deviation (window=500) over the same temperature frame.
# NOTE: `df` is not loaded here; it must already hold the data read from
# 'data/temperature_2014_18.csv' by the preceding cell, so run that cell first.
# NOTE(review): export=True presumably writes results under `output_path` --
# confirm against timeseries_module.main.
temp_std = main(
    input_df=df,
    output_path="output/temperature_2014_18_std",
    outlier_sensitivity_degree=None,
    value_column="Temperature",
    missing_value_function=None,
    outlier_fn=None,
    time_column="datetime",
    rolling_fn=rolling_std,
    rolling_kwargs={"window": 500},
    export=True,
)

# Bare last expression -> rich DataFrame display instead of print() text.
temp_std.head()

   Unnamed: 0             datetime  Temperature
0           0  2014-01-01 06:00:00         9.44
1           1  2014-01-01 07:00:00        11.87
2           2  2014-01-01 08:00:00        14.55
3           3  2014-01-01 09:00:00        17.81
4           4  2014-01-01 10:00:00        21.96
