In [1]:
import pandas as pd
from sklearn.linear_model import LinearRegression, Lasso
from sklearn.metrics import mean_squared_error
from math import sqrt

## Load the dataset into the Python environment

In [2]:
# Source CSV, given as a relative path (resolved against the current working directory).
DATA_PATH = 'car_age_price.csv'
df = pd.read_csv(DATA_PATH)

## Check the basic details of the dataset

In [3]:
# Preview the first rows of the frame to sanity-check the column names and values.
df.head()

Unnamed: 0,Year,Price
0,2018,465000
1,2019,755000
2,2019,700000
3,2018,465000
4,2018,465000


In [7]:
# Print a structural summary: row count, per-column non-null counts, dtypes and memory usage.
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 112 entries, 0 to 111
Data columns (total 2 columns):
 #   Column  Non-Null Count  Dtype
---  ------  --------------  -----
 0   Year    112 non-null    int64
 1   Price   112 non-null    int64
dtypes: int64(2)
memory usage: 1.9 KB


## Split the dataset into features (Year) and target variable (Price)

In [5]:
# Target: the Price column, kept as a pandas Series.
y = df['Price']
# Feature: the Year column as a NumPy array reshaped to a single column, i.e. shape (n_rows, 1).
X = df['Year'].to_numpy().reshape(-1, 1)

## Create a Linear Regression model

In [6]:
# Least-squares regression of Price on Year with the estimator's default settings,
# fitted on the full dataset (no train/test split is made in this notebook).
linear_model = LinearRegression()
linear_model.fit(X=X, y=y)

## Create a Lasso Regression model

In [8]:
# L1-regularised regression of Price on Year with the estimator's default settings,
# fitted on the same full dataset as the linear model so the two are directly comparable.
lasso_model = Lasso()
lasso_model.fit(X=X, y=y)

## Compare the performance of Linear Regression and Lasso Regression

In [9]:
# Score each model on the same data it was fitted on (in-sample error), so these
# RMSE values describe goodness of fit rather than performance on unseen cars.

# Linear Regression: predictions -> mean squared error -> root mean squared error.
linear_predictions = linear_model.predict(X)
linear_mse = mean_squared_error(y, linear_predictions)
linear_rmse = sqrt(linear_mse)

# Lasso Regression: identical pipeline for a like-for-like comparison.
lasso_predictions = lasso_model.predict(X)
lasso_mse = mean_squared_error(y, lasso_predictions)
lasso_rmse = sqrt(lasso_mse)

print('Linear Regression RMSE:', linear_rmse)
print('Lasso Regression RMSE:', lasso_rmse)

Linear Regression RMSE: 57242.65163812557
Lasso Regression RMSE: 57242.651641444245


In [11]:
# The RMSE scores for Linear Regression and Lasso Regression are almost identical: they differ by only about 3e-6, i.e. around the 6th decimal place, so both models perform essentially the same on this dataset.
# This near-identity is not surprising here. The model has a single feature (Year), so there are no redundant or correlated predictors for Lasso's L1 penalty to shrink away, and Lasso therefore offers no substantial advantage over Linear Regression.
# With the default regularization strength (alpha=1.0) the penalty is also negligible compared with the squared-error term when prices are in the hundreds of thousands, so the Lasso coefficient is barely shrunk and its predictions and RMSE match those of Linear Regression.
# Note that both RMSE values are computed on the same data the models were fitted on, so they measure in-sample fit rather than performance on unseen data.