In [None]:
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.linear_model import LinearRegression
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_squared_error, r2_score

# Toy dataset: hours studied paired with the marks obtained
data = {
    'Hours_Studied': [1, 2, 3, 4, 5, 6, 7, 8, 9, 10],
    'Marks_Obtained': [20, 25, 32, 35, 45, 50, 52, 60, 70, 85],
}
df = pd.DataFrame(data)

# Feature matrix and target vector.
# The list selector keeps X two-dimensional (a one-column DataFrame);
# the scalar selector gives y as a one-dimensional Series.
X = df.loc[:, ['Hours_Studied']]
y = df.loc[:, 'Marks_Obtained']

# Split the rows into training and held-out sets.
# test_size=0.2 reserves 20% of the rows for evaluation; random_state=1
# pins the shuffle so the split is the same on every run.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=1,
)

# Fit the linear regression on the training rows (fit() returns the estimator)
model = LinearRegression().fit(X_train, y_train)

# Predicted marks for the held-out rows
y_pred = model.predict(X_test)

# Report the fitted line's parameters, the held-out predictions, and the
# metrics computed from y_test versus y_pred, one labelled line each.
report = (
    ("🎯 Coefficient (Slope):", model.coef_[0]),
    ("📍 Intercept:", model.intercept_),
    ("📈 Predicted values:", y_pred),
    ("✅ R2 Score:", r2_score(y_test, y_pred)),
    ("🔍 Mean Squared Error:", mean_squared_error(y_test, y_pred)),
)
for label, value in report:
    print(label, value)

# Plot every observed row as a blue point and overlay, in red, the model's
# prediction for those same hours.
fig, ax = plt.subplots()
fitted_marks = model.predict(X)
ax.scatter(X, y, color='blue', label='Actual Data')
ax.plot(X, fitted_marks, color='red', label='Regression Line')
ax.set_xlabel("Hours Studied")
ax.set_ylabel("Marks Obtained")
ax.set_title("Simple Linear Regression")
ax.legend()
ax.grid(True)
plt.show()

# Predict for a new value.
# The model was fitted on a DataFrame, so it remembers the training column
# name. Passing a bare nested list at predict time makes scikit-learn emit
# "X does not have valid feature names"; wrapping the input in a DataFrame
# that reuses X's columns keeps fit-time and predict-time inputs consistent.
sample = pd.DataFrame([[7.5]], columns=X.columns)  # e.g., 7.5 hours studied
predicted_marks = model.predict(sample)
print("📌 Predicted marks for 7.5 hours:", round(predicted_marks[0], 2))
