## Compare Data Completeness Over Time

**Description**: Analyze how the amount of missing data in `"sales_data.csv"` changes across the months covered by its "date" column, and visualize the missing-data rate for each month.

In [None]:
# Write your code from here
import pandas as pd
import matplotlib.pyplot as plt

def _monthly_missing_rate(df):
    """Return the percentage of missing cells for each calendar month.

    Args:
        df: DataFrame whose ``date`` column is already datetime-typed and
            contains no NaT values.

    Returns:
        A Series indexed by monthly period (index name ``month``) holding the
        share of missing cells, in percent, across all columns of ``df``.
    """
    # Group by an external key rather than adding a helper column to the
    # frame: a helper column is never missing, so counting it would dilute
    # the rate, and whether groupby.apply passes grouping columns to the
    # callback differs between pandas versions.
    months = df['date'].dt.to_period('M').rename('month')

    # Within one month every column has the same number of rows, so the mean
    # of the per-column missing fractions equals missing cells / total cells.
    return df.isna().groupby(months).mean().mean(axis=1) * 100


def plot_missing_data_trend(file_path):
    """Plot the monthly missing-data rate of a CSV file with a ``date`` column.

    Rows whose ``date`` value cannot be parsed are discarded. The remaining
    rows are grouped by calendar month and, for each month, the percentage of
    missing cells across the file's columns is drawn as a line chart.

    Args:
        file_path: Location of the CSV file, passed to ``pandas.read_csv``.

    Raises:
        KeyError: If the file has no ``date`` column.
        ValueError: If no row has a parseable ``date`` value, so there is
            nothing to plot.
    """
    import os  # local import so the block does not rely on a file-level one

    df = pd.read_csv(file_path)

    # Unparseable dates become NaT so they can be dropped in the next step.
    df['date'] = pd.to_datetime(df['date'], errors='coerce')
    df = df.dropna(subset=['date'])

    # Fail early with a clear message instead of handing an empty result to
    # the plotting layer.
    if df.empty:
        raise ValueError(
            f"No rows with a parseable 'date' value were found in {file_path!r}"
        )

    missing_rate_by_month = _monthly_missing_rate(df)

    # Label the chart with the file that was actually analysed; fall back to
    # a generic label for non-path inputs such as open file objects.
    if isinstance(file_path, (str, os.PathLike)):
        source_name = os.path.basename(os.fspath(file_path))
    else:
        source_name = "dataset"

    ax = missing_rate_by_month.plot(
        kind='line', marker='o', figsize=(10, 5), color='crimson'
    )
    ax.set_title(f"Monthly Missing Data Rate in {source_name}")
    ax.set_xlabel("Month")
    ax.set_ylabel("Missing Data Rate (%)")
    ax.grid(True)
    plt.tight_layout()
    plt.show()

# Example usage: chart the monthly missing-data trend for the sales dataset.
plot_missing_data_trend(file_path="sales_data.csv")
