In [2]:
# Import necessary libraries
import numpy as np
import matplotlib.pyplot as plt
from sklearn.linear_model import LinearRegression

# Toy dataset: one feature (hours studied) and one target (marks scored).
# scikit-learn expects a 2-D feature matrix, hence the single-column reshape.
hours = np.arange(1, 10).reshape(-1, 1)                  # Feature (X): 1..9
marks = np.array([35, 40, 50, 55, 65, 70, 75, 80, 85])   # Target (Y)

# fit() returns the estimator itself, so construction and training can chain.
model = LinearRegression().fit(hours, marks)

# In-sample predictions; used below to draw the fitted line.
predicted_marks = model.predict(hours)

# Report the fitted parameters of marks = m * hours + b.
print("Slope (m):", model.coef_[0])
print("Intercept (b):", model.intercept_)

# Overlay the fitted line on the observed points.
fig, ax = plt.subplots()
ax.scatter(hours, marks, color='blue', label='Actual Marks')
ax.plot(hours, predicted_marks, color='red', label='Regression Line')
ax.set_title("Simple Linear Regression: Hours vs Marks")
ax.set_xlabel("Hours Studied")
ax.set_ylabel("Marks Scored")
ax.legend()
ax.grid(True)
plt.show()

In [2]:
# Import necessary libraries
import numpy as np
from sklearn.linear_model import LinearRegression

# Feature matrix: one row per student, columns are [English, Science, History].
subject_scores = [
    [70, 90, 74],
    [60, 85, 65],
    [80, 88, 78],
    [90, 95, 82],
    [75, 80, 72],
]
X = np.array(subject_scores)

# Target: final marks per student (illustrative values only).
y = np.array([80, 70, 85, 95, 78])

# fit() returns the estimator, so the model is built and trained in one step.
model = LinearRegression().fit(X, y)

# Show one coefficient per subject, followed by the intercept.
for label, value in (("Coefficients:", model.coef_), ("Intercept:", model.intercept_)):
    print(label, value)

# Score a single new student; predict() needs a 2-D (1, n_features) input.
new_student = np.array([70, 90, 74]).reshape(1, -1)  # English, Science, History
predicted_score = model.predict(new_student)
print("Predicted Final Score:", predicted_score[0])

In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error, r2_score

# Load the first 100 rows of the housing CSV.
df = pd.read_csv("/content/sample_data/california_housing_train.csv")
df = df.head(100)

# Colab's bundled CSV exposes raw census columns (housing_median_age,
# total_rooms, households, ...), not the per-household features named
# AveRooms / HouseAge in scikit-learn's fetch_california_housing. Indexing
# them directly raises KeyError, so derive any that are absent. Columns that
# already exist are left untouched.
derived_features = {
    'AveRooms': lambda d: d['total_rooms'] / d['households'],
    'HouseAge': lambda d: d['housing_median_age'],
}
df = df.assign(**{
    name: build for name, build in derived_features.items()
    if name not in df.columns
})

# Single feature and target, both shaped (n_samples, 1).
X = df['AveRooms'].values.reshape(-1, 1)
y = df['HouseAge'].values.reshape(-1, 1)

# Fit ordinary least squares and compute in-sample predictions.
model = LinearRegression()
model.fit(X, y)
y_pred = model.predict(X)

# Observed points with the fitted line on top.
plt.scatter(X, y, color='blue', label='Actual')
plt.plot(X, y_pred, color='red', linewidth=2, label='Predicted')
plt.xlabel("Average Rooms")
plt.ylabel("House Age")
plt.title("Linear Regression: Average Rooms vs House Age")
plt.legend()
plt.show()

# In-sample fit quality (no held-out split is made in this cell).
mse = mean_squared_error(y, y_pred)
r2 = r2_score(y, y_pred)

print("Mean Squared Error:", mse)
print("R2 Score:", r2)


In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report, confusion_matrix

# Load the first 100 rows of the housing CSV.
df = pd.read_csv('/content/sample_data/california_housing_train.csv')
df = df.head(100)

# Colab's bundled CSV exposes raw census columns (housing_median_age,
# total_rooms, households, ...), not the AveRooms / HouseAge features of
# scikit-learn's fetch_california_housing. Derive any that are absent so the
# lookups below do not raise KeyError. assign() also returns a fresh frame,
# so the column added next is not written into a slice of the loaded data.
derived_features = {
    'AveRooms': lambda d: d['total_rooms'] / d['households'],
    'HouseAge': lambda d: d['housing_median_age'],
}
df = df.assign(**{
    name: build for name, build in derived_features.items()
    if name not in df.columns
})

# Binary target: 1 when a row's average rooms exceeds the sample mean.
df['HighAveRooms'] = (df['AveRooms'] > df['AveRooms'].mean()).astype(int)

X = df[['HouseAge']]
y = df['HighAveRooms']

# Hold out 20% of the rows for evaluation; the seed keeps the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

model = LogisticRegression()
model.fit(X_train, y_train)

y_pred = model.predict(X_test)

print(confusion_matrix(y_test, y_pred))
print(classification_report(y_test, y_pred))

# Sort by the feature before drawing the probability line. plot() joins
# points in row order, so unsorted input draws zig-zag chords across the
# sigmoid instead of the curve itself.
X_sorted = X.sort_values('HouseAge')
plt.scatter(X['HouseAge'], y, color='blue', label='Data')
plt.plot(X_sorted['HouseAge'], model.predict_proba(X_sorted)[:, 1],
         color='red', label='Logistic Regression Curve')
plt.xlabel("House Age")
plt.ylabel("Probability of High Average Rooms")
plt.title("Logistic Regression")
plt.legend()
plt.show()


In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Load the first 100 rows of the housing CSV.
df = pd.read_csv("/content/sample_data/california_housing_train.csv")
df = df.head(100)

# Pairwise correlations over the columns exactly as loaded.
corr = df.corr()

plt.figure(figsize=(10, 8))
sns.heatmap(corr, annot=True, cmap='coolwarm')
plt.title("Correlation Heatmap")
plt.show()

# Colab's bundled CSV exposes raw census columns, not the AveRooms / HouseAge /
# AveOccup features of scikit-learn's fetch_california_housing, so selecting
# them directly raises KeyError. Derive any that are absent into a separate
# frame used only for the pairplot, which keeps the heatmap above limited to
# the CSV's own columns.
derived_features = {
    'AveRooms': lambda d: d['total_rooms'] / d['households'],
    'HouseAge': lambda d: d['housing_median_age'],
    'AveOccup': lambda d: d['population'] / d['households'],
}
pair_df = df.assign(**{
    name: build for name, build in derived_features.items()
    if name not in df.columns
})[['AveRooms', 'HouseAge', 'AveOccup']]

# pairplot creates its own figure, which becomes the current one, so the
# suptitle below attaches to the pairplot rather than the heatmap.
sns.pairplot(pair_df)
plt.suptitle("Pairplot of Selected Features", y=1.02)
plt.show()
