In [7]:
# Import libraries
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error
# Read the already-cleaned listings CSV; the file is expected in the working directory.
data = pd.read_csv('cleaned_real_estate_data.csv')

# Preview the leading rows to confirm the columns loaded as expected.
print(data.head(5))

# Step 1: Data quality check - count the missing entries in each column.
print(data.isna().sum())

# Step 2: Feature selection
# Predictors are the four property attributes; the target is the 'tx_price' column.
X = data.loc[:, ['beds', 'baths', 'sqft', 'year_built']]
y = data.loc[:, 'tx_price']

# Step 3: Hold out 20% of the rows for testing; the fixed seed keeps the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, random_state=42, test_size=0.2
)

# Step 4: Model training - fit a linear regression on the training portion.
model = LinearRegression().fit(X_train, y_train)

# Step 5: Model evaluation - predict the target for the held-out rows.
y_pred = model.predict(X_test)

   tx_price  beds  baths  sqft  year_built
0    295850     1      1   584        2013
1    216500     1      1   612        1965
2    279900     1      1   615        1963
3    379900     1      1   618        2000
4    340000     1      1   634        1992
tx_price      0
beds          0
baths         0
sqft          0
year_built    0
dtype: int64


In [8]:
# Score the held-out predictions: mean of the squared gaps between actual and
# predicted target values (same units as the target, squared).
mse = mean_squared_error(y_true=y_test, y_pred=y_pred)
print(f'Mean Squared Error: {mse}')

Mean Squared Error: 17957350951.99832


In [None]:
# Step 6: User Input for Prediction
def _ask_number(question, cast, read):
    """Prompt with `question` until the reply converts via `cast` to a finite, non-negative number."""
    while True:
        reply = read(question)
        try:
            value = cast(reply)
        except ValueError:
            # Not parseable as a number at all (e.g. "abc", or "3.5" for an int field).
            value = None
        # The chained comparison is False for NaN, +/-infinity and negatives alike,
        # so one test rejects every value the model cannot sensibly score.
        if value is not None and 0 <= value < float("inf"):
            return value
        print(f"'{reply}' is not a valid non-negative number. Please try again.")


def predict_tax_price(estimator=None, read=None):
    """Interactively collect one property's details and print the predicted price.

    Prompts for bedrooms, bathrooms and square footage (parsed as floats) and
    the year built (parsed as an int). An invalid reply no longer aborts the
    call: the same question is asked again until a usable number is given.

    Args:
        estimator: Fitted object exposing ``predict(DataFrame)``. Defaults to
            the notebook-level ``model`` variable, looked up at call time.
        read: Callable taking a prompt string and returning the reply.
            Defaults to the built-in ``input``, resolved at call time.

    Returns:
        None. The prediction is written to stdout.

    NOTE(review): the notebook trains on the ``tx_price`` column, while the
    message printed here says "Tax Price" - confirm which wording is intended.
    """
    if estimator is None:
        estimator = model
    if read is None:
        read = input

    print("Enter property details:")
    beds = _ask_number("Number of bedrooms: ", float, read)
    baths = _ask_number("Number of bathrooms: ", float, read)
    sqft = _ask_number("Square footage: ", float, read)
    year_built = _ask_number("Year built: ", int, read)

    # Single-row frame with the same column names and order used for training,
    # so the estimator receives the features it was fitted on.
    input_data = pd.DataFrame(
        [[beds, baths, sqft, year_built]],
        columns=['beds', 'baths', 'sqft', 'year_built'],
    )

    # Predict the tax price
    predicted_tax_price = estimator.predict(input_data)
    print(f"Predicted Tax Price: ${predicted_tax_price[0]:,.2f}")

# Keep offering predictions until the user asks to quit.
# The reply is trimmed and lower-cased before comparison so that "Q" or "q "
# also ends the session instead of starting another round of prompts.
userIn = 'c'
while userIn.strip().lower() != 'q':
    # Call the prediction function
    predict_tax_price()
    userIn = input("Enter 'q' to quit. To continue, enter any other key: ")


: 