# Logit Model using scikit-learn (Machine Learning)

In [1]:
# Import
import pandas as pd
import os
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import train_test_split

In [2]:
# Read the cleaned listings CSV from the local data folder into a DataFrame
listings_path = os.path.join('data', 'yvr_listing_data_cleaned.csv')
listings_df = pd.read_csv(listings_path)

In [3]:
# Separate the target column (y) from the remaining feature columns (X)
y = listings_df['legal_listing']
X = listings_df.drop(columns=['legal_listing'])

# Hold out 20% of the rows for testing; the fixed seed keeps the split reproducible
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

# Build the logistic regression classifier and train it in one step
# (fit() returns the estimator itself, so the chained call yields the fitted model)
logit_model = LogisticRegression(max_iter=10000).fit(X_train, y_train)

# Report mean accuracy on the held-out test set
test_accuracy = logit_model.score(X_test, y_test)
print(f'Accuracy: {test_accuracy}')


Accuracy: 0.9065550906555091


```python
# To test on a new listing, use the following code:
# The sample is built as a one-row DataFrame that reuses the training columns (X),
# so its feature count and order always match what the model was fitted on and
# scikit-learn does not warn that the input lacks valid feature names.
new_listing = pd.DataFrame([[1] * X.shape[1]], columns=X.columns)  # Fill columns with proper values
print(logit_model.predict(new_listing))        # predicted class label
print(logit_model.predict_proba(new_listing))  # class probabilities, ordered as logit_model.classes_

# To save the model, use the following code:
import pickle
with open('model.pkl', 'wb') as f:
    pickle.dump(logit_model, f)

# To load the model, use the following code:
# WARNING: unpickling can execute arbitrary code, so only load model files you
# created yourself or fully trust. Load with the same scikit-learn version that
# was used to save the model; loading across versions is not supported.
import pickle  # repeated so this snippet also runs on its own in a fresh session
with open('model.pkl', 'rb') as f:
    logit_model = pickle.load(f)
```