In [1]:
import numpy as np
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error

# Sample data creation
# A tiny hand-written housing table: three numeric features and the target 'Price'.
# In this sample Price is exactly 100 * SquareFootage + 100000, so a linear model
# can fit it perfectly and the reported error is expected to be ~0.
data = {
    'SquareFootage': [1000, 1500, 2000, 2500, 3000, 3500],
    'Bedrooms': [3, 2, 3, 4, 3, 5],
    'Bathrooms': [2, 1, 2, 3, 2, 4],
    'Price': [200000, 250000, 300000, 350000, 400000, 450000]
}

df = pd.DataFrame(data)

# Feature matrix and target array
X = df[['SquareFootage', 'Bedrooms', 'Bathrooms']]
y = df['Price']

# Splitting the dataset into training and testing sets
# (20% held out; fixed random_state so the split is the same on every run)
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Creating and training the Linear Regression model
model = LinearRegression()
model.fit(X_train, y_train)

# Making predictions on the held-out rows
predictions = model.predict(X_test)

# Evaluating the model
mse = mean_squared_error(y_test, predictions)
print("Mean Squared Error:", mse)

# Example of making a prediction
# Predict the price of a house with 2000 square feet, 3 bedrooms, and 2 bathrooms.
# The model was fitted on a DataFrame with named columns, so the example is also
# passed as a DataFrame carrying the same column names (taken from X). Passing a
# bare array would make scikit-learn warn that the input has no valid feature
# names and would rely purely on positional order.
example_features = pd.DataFrame([[2000, 3, 2]], columns=X.columns)
predicted_price = model.predict(example_features)
print(f"Predicted price for a house with 2000 square feet, 3 bedrooms, and 2 bathrooms: ${predicted_price[0]:.2f}")

Mean Squared Error: 3.3881317890172014e-21
Predicted price for a house with 2000 square feet, 3 bedrooms, and 2 bathrooms: $300000.00




In [3]:
import pandas as pd

# Build a small synthetic housing table. The two evenly spaced columns are
# generated with range(); the irregular ones are spelled out explicitly.
data = dict(
    SquareFootage=list(range(1000, 5000, 500)),
    Bedrooms=[2, 3, 2, 4, 3, 5, 4, 5],
    Bathrooms=[1, 2, 2, 3, 2, 4, 3, 4],
    Price=list(range(200000, 600000, 50000)),
)

df = pd.DataFrame(data)

# Persist the table as CSV (row index omitted), then echo the raw dict.
df.to_csv(path_or_buf=r'C:\Users\Solomon\Downloads\Solomon.csv', index=False)
print(data)

{'SquareFootage': [1000, 1500, 2000, 2500, 3000, 3500, 4000, 4500], 'Bedrooms': [2, 3, 2, 4, 3, 5, 4, 5], 'Bathrooms': [1, 2, 2, 3, 2, 4, 3, 4], 'Price': [200000, 250000, 300000, 350000, 400000, 450000, 500000, 550000]}


In [4]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error

# Load the dataset from the CSV file
df = pd.read_csv(r'C:\Users\Solomon\Downloads\Solomon.csv')

# Separate features and target variable
X = df[['SquareFootage', 'Bedrooms', 'Bathrooms']]
y = df['Price']

# Split the data into training and testing sets
# (20% held out; fixed random_state so the split is the same on every run)
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Initialize and train the Linear Regression model
model = LinearRegression()
model.fit(X_train, y_train)

# Make predictions on the held-out rows and evaluate the model
predictions = model.predict(X_test)
mse = mean_squared_error(y_test, predictions)
print("Mean Squared Error:", mse)

# Example prediction: 2000 sqft, 3 bedrooms, 2 bathrooms.
# The model was fitted on a DataFrame with named columns, so the example is
# wrapped in a one-row DataFrame with the same column names (taken from X).
# A plain nested list carries no names, which makes scikit-learn warn about
# missing feature names and depend on positional order alone.
example_features = pd.DataFrame([[2000, 3, 2]], columns=X.columns)
predicted_price = model.predict(example_features)
print(f"Predicted price for a house with 2000 square feet, 3 bedrooms, and 2 bathrooms: ${predicted_price[0]:,.2f}")

Mean Squared Error: 8.470329472543003e-21
Predicted price for a house with 2000 square feet, 3 bedrooms, and 2 bathrooms: $300,000.00


