In [1]:
import pandas as pd
import numpy as np 

# --- PHASE 1: Loading ---
df = pd.read_csv('Data.csv')
print("Data Loaded Successfully!")

# --- PHASE 2: Cleaning ---
# Parse the subscription dates, derive the subscription year from the parsed
# values, then discard the columns the rest of the cell does not use.
# Entries passed to assign() are evaluated in order, so the year lambda sees
# the already-parsed 'Subscription Date' column.
df = (
    df.assign(
        **{
            'Subscription Date': lambda frame: pd.to_datetime(frame['Subscription Date']),
            'Subscription Year': lambda frame: frame['Subscription Date'].dt.year,
        }
    )
    .drop(columns=['Index', 'Phone 1', 'Phone 2', 'Website'])
)

# --- PHASE 3: Analysis ---
# 1. Growth: number of distinct customer identifiers.
unique_customers = df['Customer Id'].nunique()
print(f"Total Unique Customers: {unique_customers}")

# 2. Value Analysis (Tenure)
# The reference date is pinned to a fixed value; tenure is the whole number
# of days between each subscription date and that reference date.
ref_date = pd.to_datetime("2023-01-01")
df = df.assign(
    **{'Active Days': lambda frame: (ref_date - frame['Subscription Date']).dt.days}
)

# 3. Segmentation
def get_segment(days, new_max_days=365, regular_max_days=730):
    """Classify a customer tenure, expressed in days, into a segment label.

    Parameters
    ----------
    days : int or float
        Number of days the customer has been active. May be missing
        (``None``, ``NaN``, ``pd.NA`` or ``pd.NaT``).
    new_max_days : int, default 365
        Largest tenure (inclusive) that is still labelled "New".
    regular_max_days : int, default 730
        Largest tenure (inclusive) that is still labelled "Regular".

    Returns
    -------
    str
        "New", "Regular" or "Loyal"; "Unknown" when ``days`` is missing.

    Notes
    -----
    Negative tenures satisfy the first bound and are therefore labelled "New".
    """
    # A missing tenure fails both comparisons below (NaN) or raises (None /
    # pd.NA); without this guard NaN would silently fall through to "Loyal".
    if pd.isna(days):
        return "Unknown"
    if days <= new_max_days:
        return "New"
    if days <= regular_max_days:
        return "Regular"
    return "Loyal"

# Label every row by passing its 'Active Days' value through get_segment.
df['Segment'] = df['Active Days'].map(get_segment)

# Check Result: number of rows per segment label.
print("\nSegment Counts:")
print(df['Segment'].value_counts())

# --- PHASE 4: Export ---
# Keep only the rows labelled 'Loyal' and write them to CSV without the index.
loyal_customers = df.loc[df['Segment'].eq('Loyal')]
loyal_customers.to_csv('Loyal_Customers_List.csv', index=False)
print("\nFile 'Loyal_Customers_List.csv' has been saved!")

Data Loaded Successfully!
Total Unique Customers: 100000

Segment Counts:
Segment
Loyal      41898
Regular    41211
New        16891
Name: count, dtype: int64

File 'Loyal_Customers_List.csv' has been saved!
