In [1]:
import logging

In [None]:
import logging

# Configure logging: INFO and above go to both a log file and the console.
logging.basicConfig(
    level=logging.INFO,
    format='%(asctime)s - %(levelname)s - %(message)s',
    handlers=[
        logging.FileHandler("eda_task_1.log"),
        logging.StreamHandler(),
    ],
    # basicConfig() does nothing when the root logger already has handlers
    # (for instance when this cell is run a second time, or when the hosting
    # runtime installed its own handler first). force=True (Python 3.8+)
    # removes and closes those handlers so this configuration is applied.
    force=True,
)

logging.info("Starting EDA for customer purchasing behavior.")

# Data loading: read the four CSV inputs through eda.load_data.
# The directory is named once so the individual file paths cannot drift apart.
DATA_DIR = '/content/drive/MyDrive/KIFIYA Projects/Rossmann-Pharmaceuticals/data'

try:
    logging.info("Loading dataset...")
    train_data = eda.load_data(f'{DATA_DIR}/train.csv')
    store_data = eda.load_data(f'{DATA_DIR}/store.csv')
    sample_data = eda.load_data(f'{DATA_DIR}/sample_submission.csv')
    test_data = eda.load_data(f'{DATA_DIR}/test.csv')
    logging.info("Dataset loaded successfully.")
except Exception as e:
    # logging.exception records the traceback alongside the message.
    logging.exception("Error loading dataset: %s", e)
    # Every later stage reads these variables; continuing would only produce
    # follow-on NameErrors that hide the real cause, so stop here.
    raise

# Data cleaning process: pass each loaded dataset through eda.clean_data and
# keep the results under separate cleaned_* names.
try:
    logging.info("Starting data cleaning process...")
    cleaned_store_data = eda.clean_data(store_data)
    cleaned_train_data = eda.clean_data(train_data)
    cleaned_test_data = eda.clean_data(test_data)
    cleaned_sample_data = eda.clean_data(sample_data)
    logging.info("Data cleaning completed successfully.")
except Exception as e:
    # logging.exception records the traceback alongside the message.
    logging.exception("Error during data cleaning: %s", e)
    # The visualization stage needs the cleaned_* variables; re-raise instead
    # of letting it fail later with an unrelated NameError.
    raise

# Visualization process: run every eda analysis/plot helper on the cleaned
# data. The values returned by the last four helpers are kept in module-level
# names so they remain available after this stage.
try:
    logging.info("Visualizing data...")
    eda.plot_promotion_distribution(cleaned_train_data, cleaned_test_data)
    eda.holiday_analysis(cleaned_train_data)
    eda.seasonal_analysis_with_holidays(cleaned_train_data)
    eda.customer_behavior_analysis(cleaned_train_data)
    eda.analyze_promotions(cleaned_train_data)
    eda.promo_effectiveness_analysis(cleaned_train_data, cleaned_store_data)
    eda.store_hours_analysis(cleaned_train_data)
    eda.store_opening_impact(cleaned_train_data)
    open_weekday_stores, weekend_sales_data = eda.analyze_weekday_open_stores(cleaned_train_data)
    assortment_sales_summary = eda.analyze_assortment_effect_on_sales(cleaned_store_data, cleaned_train_data)
    city_center_analysis = eda.analyze_competitor_distance_effect(cleaned_store_data, cleaned_train_data)
    sales_comparison = eda.analyze_new_competitors_effect(cleaned_store_data, cleaned_train_data)
    logging.info("Visualization completed successfully.")
except Exception as e:
    # logging.exception records the traceback alongside the message.
    logging.exception("Error during visualization: %s", e)
else:
    # Report overall success only when the stage above raised nothing;
    # previously this line was logged even right after an error.
    logging.info("EDA completed successfully.")