# Linear Regression
#### by Joshua Rodriguez

##### 1. Choose a dataset from https://archive.ics.uci.edu
##### 2. Perform regression analysis on your chosen dataset

In [13]:
from ucimlrepo import fetch_ucirepo
import pandas as pd
from sklearn.linear_model import LinearRegression
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_squared_error, r2_score

In [None]:

# Fetch the UCI "Computer Hardware" dataset (id=29).
computer_hardware = fetch_ucirepo(id=29)

# ucimlrepo hands back pandas DataFrames already, so no re-wrapping is needed.
# Depending on the variable roles declared by the repository, PRP may arrive in
# `features` or in `targets` (expected to be None when no target role is
# declared -- confirm against the ucimlrepo docs), so gather every available
# column before choosing the target ourselves.
available_parts = [
    part
    for part in (computer_hardware.data.features, computer_hardware.data.targets)
    if part is not None
]
data = pd.concat(available_parts, axis=1)
# Guard against a column being listed in both frames.
data = data.loc[:, ~data.columns.duplicated()]

# Target: PRP (published relative performance).
target_column = "PRP"
if target_column not in data.columns:
    raise KeyError(
        f"Expected column '{target_column}' in dataset, found: {list(data.columns)}"
    )
y = data[target_column]

# Predictors:
#   * drop the target itself;
#   * drop ERP -- per the dataset description it is the relative performance
#     estimated by the original article's regression, i.e. a prediction of PRP,
#     so keeping it would leak the target into the features;
#   * keep numeric columns only, because LinearRegression cannot fit on the
#     string identifiers (vendor / model names).
X = data.drop(columns=[target_column, "ERP"], errors="ignore").select_dtypes(
    include="number"
)

# Check the shapes of X and y to ensure they are correctly loaded
print(X.shape)
print(y.shape)

# Split the data into training and testing sets (fixed seed for reproducibility)
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)

# Initialize the Linear Regression model
model = LinearRegression()

# Train the model
model.fit(X_train, y_train)

# Make predictions on the held-out split
y_pred = model.predict(X_test)

# Evaluate the model
mse = mean_squared_error(y_test, y_pred)
r2 = r2_score(y_test, y_pred)

print(f"Mean Squared Error: {mse}")
print(f"R^2 Score: {r2}")

# Display coefficients, one row per predictor column
coefficients = pd.DataFrame({"Coefficient": model.coef_}, index=X.columns)
print(coefficients)
