In [None]:
# import libraries
import pandas as pd
import numpy as np
from scipy import stats

In [None]:
# Load the experiment export into a DataFrame.
# The path is relative, so it is resolved against the kernel's working directory.
DATA_PATH = 'fittrack_data.csv'
df = pd.read_csv(DATA_PATH)

In [None]:
# Parse the Date column into pandas datetimes, then write it back over the
# original column so later cells group on real timestamps.
parsed_dates = pd.to_datetime(df['Date'])
df['Date'] = parsed_dates

In [None]:
# Sum Logged_Workout for every (Date, Has_QuickLog) pair, then pivot the
# Has_QuickLog level into columns: one row per date, one column per arm.
# A date with no rows for an arm shows up as NaN in that arm's column.
group_keys = ['Date', 'Has_QuickLog']
workouts_by_date_and_arm = df.groupby(group_keys)['Logged_Workout'].sum()
grouped = workouts_by_date_and_arm.unstack(level='Has_QuickLog')

In [None]:
# Split the pivoted table into one per-day series per experiment arm.
# Assumes Has_QuickLog is coded 0 (control) / 1 (treatment) -- TODO confirm.
# NOTE(review): each value is a daily sum of Logged_Workout; reading it as
# "daily active users" presumes one 0/1 row per user per day -- verify.
CONTROL_KEY, TREATMENT_KEY = 0, 1
results_a = grouped[CONTROL_KEY]    # Control group (without QuickLog)
results_b = grouped[TREATMENT_KEY]  # Treatment group (with QuickLog)

In [None]:
# Average the per-day values of each arm (control first, treatment second).
avg_dau_a, avg_dau_b = (
    np.mean(daily_values) for daily_values in (results_a, results_b)
)

# Report both averages rounded to two decimals.
print(f"Average DAU for group A (without quick log): {avg_dau_a:.2f}")
print(f"Average DAU for group B (with quick log): {avg_dau_b:.2f}")

In [None]:
# Perform statistical test (independent two-sample t-test on the per-day values).
#
# nan_policy='omit' drops missing observations. With the default ('propagate'),
# a single NaN -- e.g. a date on which one arm has no rows after the
# groupby/unstack -- turns both the statistic and the p-value into NaN. The
# averages above are taken with np.mean on pandas Series, which already skips
# NaN, so omitting here keeps the test consistent with the reported means.
# Results are unchanged when neither series contains NaN.
#
# NOTE(review): ttest_ind defaults to equal_var=True (Student's t-test).
# Consider equal_var=False (Welch) if the arms may differ in variance, or a
# paired test if the two arms are meant to be matched day by day.
t_statistic, p_value = stats.ttest_ind(results_a, results_b, nan_policy='omit')

print(f"T-statistic: {t_statistic:.4f}")
print(f"P-value: {p_value:.4f}")

In [None]:
# Interpret results: compare the p-value against the significance level and,
# when significant, report the direction of the change from the two averages.
alpha = 0.05  # Significance level
if np.isnan(p_value):
    # NaN compares False against alpha, so without this guard a test that
    # could not be computed would be reported as "not statistically
    # significant" instead of being flagged as unusable.
    print("The p-value is NaN; the test result cannot be interpreted.")
elif p_value < alpha:
    print("The difference is statistically significant.")
    if avg_dau_b > avg_dau_a:
        print("The quick log button improved daily active users.")
    else:
        print("The quick log button decreased daily active users.")
else:
    print("The difference is not statistically significant.")

In [None]:
# Relative change of the treatment average over the control average, in percent.
# NOTE(review): if avg_dau_a is 0 this divides by zero -- confirm the control
# average is always positive for this dataset.
absolute_lift = avg_dau_b - avg_dau_a
percent_improvement = (absolute_lift / avg_dau_a) * 100
print(f"Percentage improvement: {percent_improvement:.2f}%")