In [1]:
# 1️⃣ House Price Prediction
import pandas as pd
import numpy as np

from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.linear_model import LinearRegression, Ridge, Lasso
from sklearn.metrics import mean_squared_error, r2_score
df = pd.read_csv("/kaggle/input/california-housing-prices/housing.csv")

df = pd.get_dummies(df, drop_first=True)
df = df.dropna()
X = df.drop("median_house_value", axis=1)
y = df["median_house_value"]

X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)

scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

models = {
    "Linear Regression": LinearRegression(),
    "Ridge Regression": Ridge(alpha=1.0),
    "Lasso Regression": Lasso(alpha=0.01)
}

for name, model in models.items():
    model.fit(X_train, y_train)
    preds = model.predict(X_test)

    print(f"\n{name}")
    print("MSE:", mean_squared_error(y_test, preds))
    print("R2 Score:", r2_score(y_test, preds))



Linear Regression
MSE: 4802173538.60416
R2 Score: 0.6488402154431994

Ridge Regression
MSE: 4802177688.914903
R2 Score: 0.6488399119509963

Lasso Regression
MSE: 4802173566.343574
R2 Score: 0.6488402134147498


In [2]:
# 2 Student Marks Prediction
import pandas as pd
import numpy as np

df = pd.read_csv("/kaggle/input/students-performance-in-exams/StudentsPerformance.csv")
df = pd.get_dummies(df, drop_first=True)
X = df.drop("writing score", axis=1)
y = df["writing score"]
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.25, random_state=0
)

scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)
from sklearn.linear_model import LinearRegression, Ridge, Lasso
from sklearn.metrics import mean_squared_error, r2_score

models = {
    "Linear Regression": LinearRegression(),
    "Ridge Regression": Ridge(alpha=1.0),
    "Lasso Regression": Lasso(alpha=0.05)
}

for name, model in models.items():
    model.fit(X_train, y_train)
    preds = model.predict(X_test)

    print(f"\n{name}")
    print("MSE:", mean_squared_error(y_test, preds))
    print("R2 Score:", r2_score(y_test, preds))




Linear Regression
MSE: 12.147579105754687
R2 Score: 0.9451637327114657

Ridge Regression
MSE: 12.167819395307738
R2 Score: 0.9450723645533935

Lasso Regression
MSE: 12.0286584110402
R2 Score: 0.9457005612387573


In [3]:
# 3 Salary Prediction
import pandas as pd
import numpy as np

df = pd.read_csv("/kaggle/input/salary/Salary.csv")
df.head()
X = df[['YearsExperience']]
y = df['Salary']
from sklearn.model_selection import train_test_split

X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=1
)
from sklearn.preprocessing import StandardScaler
from sklearn.linear_model import LinearRegression, Ridge, Lasso
from sklearn.metrics import mean_squared_error, r2_score

scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

models = {
    "Linear Regression": LinearRegression(),
    "Ridge Regression": Ridge(alpha=0.5),
    "Lasso Regression": Lasso(alpha=0.01)
}

for name, model in models.items():
    model.fit(X_train, y_train)
    preds = model.predict(X_test)

    print(f"\n{name}")
    print("MSE:", mean_squared_error(y_test, preds))
    print("R2 Score:", r2_score(y_test, preds))



Linear Regression
MSE: 40308108.63707037
R2 Score: 0.9593108462602296

Ridge Regression
MSE: 41341667.492050745
R2 Score: 0.9582675168515477

Lasso Regression
MSE: 40308121.21303574
R2 Score: 0.9593108335653796


In [4]:
# 4 Car Price Prediction
import pandas as pd
import numpy as np

df = pd.read_csv("/kaggle/input/vehicle-dataset-from-cardekho/car data.csv")
df = df.drop(['Car_Name'], axis=1)
df = pd.get_dummies(df, drop_first=True)
X = df.drop("Selling_Price", axis=1)
y = df["Selling_Price"]
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)

scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)
from sklearn.linear_model import LinearRegression, Ridge, Lasso
from sklearn.metrics import mean_squared_error, r2_score

models = {
    "Linear Regression": LinearRegression(),
    "Ridge Regression": Ridge(alpha=1.0),
    "Lasso Regression": Lasso(alpha=0.05)
}

for name, model in models.items():
    model.fit(X_train, y_train)
    preds = model.predict(X_test)

    print(f"\n{name}")
    print("MSE:", mean_squared_error(y_test, preds))
    print("R2 Score:", r2_score(y_test, preds))




Linear Regression
MSE: 3.4788039706379044
R2 Score: 0.8489813024899066

Ridge Regression
MSE: 3.4897217349606047
R2 Score: 0.8485073503610563

Lasso Regression
MSE: 3.5160369713153825
R2 Score: 0.8473649770762978


In [5]:
# 5 Medical Insurance Cost Prediction
import pandas as pd
import numpy as np

df = pd.read_csv("/kaggle/input/insurance/insurance.csv")
df = pd.get_dummies(df, drop_first=True)
X = df.drop("charges", axis=1)
y = df["charges"]
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.25, random_state=10
)

scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)
from sklearn.linear_model import LinearRegression, Ridge, Lasso
from sklearn.metrics import mean_squared_error, r2_score

models = {
    "Linear Regression": LinearRegression(),
    "Ridge Regression": Ridge(alpha=1.5),
    "Lasso Regression": Lasso(alpha=0.1)
}

for name, model in models.items():
    model.fit(X_train, y_train)
    preds = model.predict(X_test)

    print(f"\n{name}")
    print("MSE:", mean_squared_error(y_test, preds))
    print("R2 Score:", r2_score(y_test, preds))



Linear Regression
MSE: 38150907.33079195
R2 Score: 0.7162745306503484

Ridge Regression
MSE: 38124574.96203128
R2 Score: 0.7164703625245665

Lasso Regression
MSE: 38150568.27679471
R2 Score: 0.7162770521697888


In [6]:
# 6 Sales Prediction
import pandas as pd
import numpy as np

df = pd.read_csv("/kaggle/input/advertising-dataset/advertising.csv")
X = df[['TV', 'Radio', 'Newspaper']]
y = df['Sales']
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=5
)

scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)
from sklearn.linear_model import LinearRegression, Ridge, Lasso
from sklearn.metrics import mean_squared_error, r2_score

models = {
    "Linear Regression": LinearRegression(),
    "Ridge Regression": Ridge(alpha=1.0),
    "Lasso Regression": Lasso(alpha=0.05)
}

for name, model in models.items():
    model.fit(X_train, y_train)
    preds = model.predict(X_test)

    print(f"\n{name}")
    print("MSE:", mean_squared_error(y_test, preds))
    print("R2 Score:", r2_score(y_test, preds))




Linear Regression
MSE: 1.8741138418894405
R2 Score: 0.9217965732000768

Ridge Regression
MSE: 1.858064939659836
R2 Score: 0.9224662652554252

Lasso Regression
MSE: 1.8650661354232583
R2 Score: 0.9221741178478565


In [7]:
# 7 Temperature Prediction
import pandas as pd
import numpy as np

df = pd.read_csv("/kaggle/input/szeged-weather/weatherHistory.csv")
df = df[['Temperature (C)', 'Humidity', 'Wind Speed (km/h)', 'Pressure (millibars)']]
df = df.dropna()
X = df[['Humidity', 'Wind Speed (km/h)', 'Pressure (millibars)']]
y = df['Temperature (C)']
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=3
)

scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)
from sklearn.linear_model import LinearRegression, Ridge, Lasso
from sklearn.metrics import mean_squared_error, r2_score

models = {
    "Linear Regression": LinearRegression(),
    "Ridge Regression": Ridge(alpha=0.8),
    "Lasso Regression": Lasso(alpha=0.02)
}

for name, model in models.items():
    model.fit(X_train, y_train)
    preds = model.predict(X_test)

    print(f"\n{name}")
    print("MSE:", mean_squared_error(y_test, preds))
    print("R2 Score:", r2_score(y_test, preds))




Linear Regression
MSE: 52.63293939633518
R2 Score: 0.421808847180866

Ridge Regression
MSE: 52.63294646016598
R2 Score: 0.4218087695822268

Lasso Regression
MSE: 52.64143637347728
R2 Score: 0.42171550493044985


In [8]:
# 8 Gold Price Prediction
import pandas as pd
import numpy as np

df = pd.read_csv("/kaggle/input/gold-price-data/gld_price_data.csv")
df = df.select_dtypes(include=[np.number])
df = df.dropna()

X = df.drop("GLD", axis=1)
y = df["GLD"]

from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=7
)

scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)
from sklearn.linear_model import LinearRegression, Ridge, Lasso
from sklearn.metrics import mean_squared_error, r2_score

models = {
    "Linear Regression": LinearRegression(),
    "Ridge Regression": Ridge(alpha=1.0),
    "Lasso Regression": Lasso(alpha=0.05)
}

for name, model in models.items():
    model.fit(X_train, y_train)
    preds = model.predict(X_test)

    print(f"\n{name}")
    print("MSE:", mean_squared_error(y_test, preds))
    print("R2 Score:", r2_score(y_test, preds))




Linear Regression
MSE: 67.49390270882927
R2 Score: 0.872559361969998

Ridge Regression
MSE: 67.48047567638011
R2 Score: 0.8725847146242895

Lasso Regression
MSE: 67.44125995614117
R2 Score: 0.8726587609634029


In [9]:
# 9 Electricity Consumption Prediction

import pandas as pd
import numpy as np

df = pd.read_csv(
    "/kaggle/input/electric-power-consumption-data-set/household_power_consumption.txt",
    sep=';',
    na_values='?',
    low_memory=False
)
df = df[['Global_active_power',
         'Voltage',
         'Global_intensity',
         'Sub_metering_1',
         'Sub_metering_2',
         'Sub_metering_3']]

df = df.dropna()
X = df.drop("Global_active_power", axis=1)
y = df["Global_active_power"]

from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=9
)

scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

from sklearn.linear_model import LinearRegression, Ridge, Lasso
from sklearn.metrics import mean_squared_error, r2_score

models = {
    "Linear Regression": LinearRegression(),
    "Ridge Regression": Ridge(alpha=1.2),
    "Lasso Regression": Lasso(alpha=0.05)
}

for name, model in models.items():
    model.fit(X_train, y_train)
    preds = model.predict(X_test)

    print(f"\n{name}")
    print("MSE:", mean_squared_error(y_test, preds))
    print("R2 Score:", r2_score(y_test, preds))




Linear Regression
MSE: 0.00202493625803658
R2 Score: 0.9981913168318708

Ridge Regression
MSE: 0.0020249363013582554
R2 Score: 0.9981913167931757

Lasso Regression
MSE: 0.0050080475063659195
R2 Score: 0.9955267869820563


In [10]:

# 10 Flight Fare Prediction

import pandas as pd
import numpy as np

# Load dataset
df = pd.read_csv("/kaggle/input/flight-price-prediction/Clean_Dataset.csv")

# Safely drop columns if they exist
df = df.drop(columns=['Unnamed: 0', 'flight_no'], errors='ignore')

# Keep only numeric columns
df = df.select_dtypes(include=[np.number])

# Remove missing values
df = df.dropna()

# Feature-target split
X = df.drop("price", axis=1)
y = df["price"]

# Train-test split
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=11
)

# Scaling
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

# Regression models
from sklearn.linear_model import LinearRegression, Ridge, Lasso
from sklearn.metrics import mean_squared_error, r2_score

models = {
    "Linear Regression": LinearRegression(),
    "Ridge Regression": Ridge(alpha=1.0),
    "Lasso Regression": Lasso(alpha=0.1)
}

for name, model in models.items():
    model.fit(X_train, y_train)
    preds = model.predict(X_test)

    print(f"\n{name}")
    print("MSE:", mean_squared_error(y_test, preds))
    print("R2 Score:", r2_score(y_test, preds))




Linear Regression
MSE: 491243687.57254004
R2 Score: 0.04690829475302538

Ridge Regression
MSE: 491243682.8569667
R2 Score: 0.04690830390199563

Lasso Regression
MSE: 491243644.54257107
R2 Score: 0.04690837823808103
