# Carbon Footprint & Recycling Prediction

This notebook demonstrates a simple machine learning workflow with a toy dataset.
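- Regression: predict the numeric carbon footprint from the `recycles_regularly` flag
- Classification: predict whether the carbon footprint is high or low (above vs. not above a threshold of 120)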


In [None]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression, LogisticRegression
from sklearn.metrics import mean_squared_error, accuracy_score

# Toy dataset: each row pairs a binary "recycles regularly" flag with a
# carbon-footprint value. Rows are zipped together from the two value lists
# and the column names are supplied explicitly.
data = pd.DataFrame(
    list(zip(
        [0, 1, 0, 1, 1, 0, 1, 0],
        [140, 80, 150, 75, 90, 160, 85, 155],
    )),
    columns=['recycles_regularly', 'carbon_footprint'],
)
print(data)

In [None]:
# Target: the numeric footprint column. Feature matrix: the single binary
# flag, selected with a list so it stays a one-column DataFrame.
y_reg = data.loc[:, 'carbon_footprint']
X = data.loc[:, ['recycles_regularly']]

# Hold out 25% of the rows for testing; the fixed seed makes the split
# reproducible from run to run.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y_reg,
    random_state=42,
    test_size=0.25,
)

# fit() returns the estimator, so construction and training are chained.
reg_model = LinearRegression().fit(X_train, y_train)

# Root-mean-squared error of the predictions on the held-out rows.
reg_pred = reg_model.predict(X_test)
rmse = mean_squared_error(y_test, reg_pred) ** 0.5
print('Test RMSE (Regression):', rmse)

In [None]:
# Binary label: 1 when the footprint is strictly greater than the threshold,
# 0 otherwise.
threshold = 120
y_clf = data['carbon_footprint'].gt(threshold).astype(int)

# Hold out 25% of the rows for testing, with a fixed seed for reproducibility.
X_train_c, X_test_c, y_train_c, y_test_c = train_test_split(
    X,
    y_clf,
    random_state=42,
    test_size=0.25,
)

# fit() returns the estimator, so construction and training are chained.
clf_model = LogisticRegression().fit(X_train_c, y_train_c)

# Score the held-out rows and show predictions next to the true labels.
clf_pred = clf_model.predict(X_test_c)
acc = accuracy_score(y_test_c, clf_pred)
print('Test Accuracy (Classification):', acc)
print('Predicted:', clf_pred)
print('True:', y_test_c.to_list())