# FDCS_1

In [3]:
"""
Identify the top correlated lags for selected columns of a CSV dataset.

Modules:
    pandas: Used to read the CSV file into a DataFrame.
    lags_identifier: Project module providing `find_top_correlated_lags`.

Functions:
    find_top_correlated_lags(df, columns, lag_range): Identifies the top correlated lags
    for the specified columns within the given lag range.

Variables:
    df (pd.DataFrame): The DataFrame containing the data read from a CSV file.
    columns (list of str): The list of column names for which to find the top correlated lags.
    lag_range (tuple of int): The (first, last) lags to consider for correlation analysis.
    strong_lags: The value returned by `find_top_correlated_lags`. The output recorded
        after this cell shows a dict mapping each column name to a list of lags.

Usage:
    The script reads a CSV file into a DataFrame, specifies the columns of interest and the
    lag range, calls `find_top_correlated_lags` and prints the result.
"""
import pandas as pd

from lags_identifier import find_top_correlated_lags

# NOTE(review): the path is just '.csv' -- it looks like a placeholder or a redacted
# file name; point it at the real dataset before running.
df = pd.read_csv(r'.csv')

columns = ['Electricity Consumption',
           'Humidity Closer to Evaporator (%)',
           'Temperature Closer to Evaporator (C)']

# Lags 168 through 336. The output recorded after this cell contains both 168 and 336,
# so both endpoints appear to be included by `find_top_correlated_lags`.
# Assuming hourly samples (168 = 7 * 24), this is the window from one week back to two
# weeks back -- TODO confirm the sampling interval of the dataset.
lag_range = (168, 336)

strong_lags = find_top_correlated_lags(df, columns, lag_range)
print(strong_lags)

{'Electricity Consumption': [168, 192, 216, 264, 240, 288, 336, 312, 215, 263], 'Humidity Closer to Evaporator (%)': [168, 192, 169, 191, 216, 170, 240, 264, 193, 171], 'Temperature Closer to Evaporator (C)': [168, 192, 216, 240, 264, 288, 312, 336, 191, 215]}


# FDCS_2

In [4]:
"""
Identify the top correlated lags for selected columns of a CSV dataset.

This script reads a CSV file into a pandas DataFrame, selects specific columns related to
electricity consumption, humidity, and temperature, and identifies the top correlated lags
within a specified range using the `find_top_correlated_lags` function from the
`lags_identifier` module.

Modules:
    pandas: Used to read the CSV file into a DataFrame.
    lags_identifier: Project module providing `find_top_correlated_lags`.

Functions:
    find_top_correlated_lags(df, columns, lag_range): Identifies the top correlated lags
    for the specified columns within the given lag range.

Variables:
    df (pd.DataFrame): The DataFrame containing the data read from the CSV file.
    columns (list of str): The list of column names to be analyzed for lag correlation.
    lag_range (tuple of int): The (first, last) lags to be considered for correlation analysis.
    strong_lags: The value returned by `find_top_correlated_lags`. The output recorded
        after this cell shows a dict mapping each column name to a list of lags.

Usage:
    The script reads data from a CSV file, identifies the top correlated lags for the
    specified columns within the given lag range, and prints the results.
"""
import pandas as pd

from lags_identifier import find_top_correlated_lags

# NOTE(review): the path is just '.csv' -- it looks like a placeholder or a redacted
# file name; point it at the real dataset before running.
df = pd.read_csv(r'.csv')

columns = ['Electricity Consumption',
           'Humidity Closer to Evaporator (%)',
           'Temperature Closer to Evaporator (C)']

# Lags 168 through 336. The output recorded after this cell contains both 168 and 336,
# so both endpoints appear to be included by `find_top_correlated_lags`.
# Assuming hourly samples (168 = 7 * 24), this is the window from one week back to two
# weeks back -- TODO confirm the sampling interval of the dataset.
lag_range = (168, 336)

strong_lags = find_top_correlated_lags(df, columns, lag_range)
print(strong_lags)

{'Electricity Consumption': [168, 169, 261, 264, 335, 243, 242, 336, 241, 186], 'Humidity Closer to Evaporator (%)': [168, 261, 169, 264, 336, 263, 178, 242, 243, 335], 'Temperature Closer to Evaporator (C)': [168, 169, 185, 264, 186, 263, 184, 218, 187, 188]}
