In [1]:
import pandas as pd 
import numpy as np

In [2]:

# Seed NumPy's global generator so every run draws the same sample sequence.
np.random.seed(42)
days = 90

# Timestamp.today() includes the current time of day; normalize it to midnight
# so the generated dates are pure calendar days and do not vary with the
# moment the script happens to be run.
dates = pd.date_range(end=pd.Timestamp.today().normalize(), periods=days)

# One row per day, in the order: date, sleep, study, phone, social media,
# mood, caffeine, exercise, classes, distractions, tasks, burnout, productivity.
data = []

for date in dates:
    # weekday() counts Monday as 0, so 5 and 6 are Saturday and Sunday.
    is_weekend = date.weekday() >= 5

    # Durations come from normal distributions, whose lower tail can dip
    # below zero. Clamp at 0 so no day reports negative hours or minutes, and
    # so the derived values and scores below are built from valid inputs.
    sleep_hours = max(0.0, np.random.normal(7, 1.2))
    # Weekends shift the means: more phone time, less studying.
    phone_usage = max(0.0, np.random.normal(5 if not is_weekend else 7, 1.5))
    study_hours = max(0.0, np.random.normal(4 if not is_weekend else 2, 1))
    exercise = max(0.0, np.random.normal(30, 10))
    mood = np.random.normal(3.5, 1)

    # Derived quantities scale with the sampled base values.
    distractions = phone_usage * np.random.uniform(2, 4)
    # randint's upper bound is exclusive: 0-4 cups, 3-5 classes on weekdays.
    caffeine = np.random.randint(0, 5)
    classes = 0 if is_weekend else np.random.randint(3, 6)
    social_media = phone_usage * np.random.uniform(0.4, 0.7)
    tasks_completed = study_hours * np.random.uniform(1, 2)

    # Burnout score: raised by phone use, distractions and caffeine;
    # lowered by sleep and exercise.
    burnout_score = (
        phone_usage * 0.5
        + distractions * 0.2
        - sleep_hours * 0.3
        - exercise * 0.1
        + caffeine * 0.2
    )

    # Productivity score: raised by study time, sleep and mood;
    # lowered by phone use and distractions.
    productivity_score = (
        study_hours * 2
        + sleep_hours
        - phone_usage
        - distractions * 0.05
        + mood * 2
    )

    data.append([
        date,
        round(sleep_hours, 2),
        round(study_hours, 2),
        round(phone_usage, 2),
        round(social_media, 2),
        round(mood, 2),
        caffeine,
        round(exercise, 2),
        classes,
        round(distractions, 2),
        round(tasks_completed, 2),
        round(burnout_score, 2),
        round(productivity_score, 2),
    ])

# Column names, in the same order as the values stored in each row of `data`.
columns = [
    "date",
    # Time spent per day
    "sleep_hours", "study_hours", "phone_usage_hours", "social_media_hours",
    # Daily state and habits
    "mood", "caffeine_cups", "exercise_minutes", "classes_attended",
    # Derived activity measures
    "distractions", "tasks_completed",
    # Composite scores
    "burnout_score", "productivity_score",
]

# Assemble the per-day rows into a labelled table.
df = pd.DataFrame(data=data, columns=columns)

# Bucket the numeric burnout score into a categorical label:
#   score <= 2 -> "Low", 2 < score <= 5 -> "Medium", score > 5 -> "High".
# The outer edges are open-ended (+/- infinity) rather than fixed at +/-100, so
# an unusually extreme score still gets a label instead of silently
# becoming NaN.
df["burnout_level"] = pd.cut(
    df["burnout_score"],
    bins=[-np.inf, 2, 5, np.inf],
    labels=["Low", "Medium", "High"],
)

# Persist the dataset without the integer row index, then report the file
# that was written.
csv_path = "student_behavior_extended.csv"
df.to_csv(csv_path, index=False)

print("CSV created: " + csv_path)

CSV created: student_behavior_extended.csv
