In [1]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error
import numpy as np

# Read the cleaned training set from disk
data = pd.read_csv('cleaned_train.csv')

# Column the model is asked to predict
target = 'CO2 Emissions(g/km)'

# Predictor columns passed to the model
features = [
    'Engine Size(L)',
    'Cylinders',
    'Fuel Consumption City (L/100km)',
    'Fuel Consumption Hwy (L/100km)',
    'Fuel Consumption Comb (L/100km)',
]

# Hold out 20% of the rows for evaluation; the fixed seed keeps the split repeatable
train_data, test_data = train_test_split(data, test_size=0.2, random_state=42)

# Build a linear regression and fit it on the training rows
# (fit() returns the estimator itself, so the chained form is equivalent)
model = LinearRegression().fit(train_data[features], train_data[target])

# Predict the target for the held-out rows
predictions = model.predict(test_data[features])

# Root Mean Squared Error (RMSE): square root of the mean squared error
mse = mean_squared_error(test_data[target], predictions)
rmse = np.sqrt(mse)
print("RMSE:", rmse)

# Print the success message when RMSE is at most 15, otherwise the retry message
print(
    "Anda dapat berlangganan GPT-4!"
    if rmse <= 15
    else "Maaf, RMSE melebihi 15. Coba tuning model atau fitur lainnya."
)


RMSE: 35.55975489227126
Maaf, RMSE melebihi 15. Coba tuning model atau fitur lainnya.


In [2]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler, PolynomialFeatures
from sklearn.linear_model import Lasso
from sklearn.metrics import mean_squared_error
import numpy as np

# Read the cleaned training set from disk
data = pd.read_csv('cleaned_train.csv')

# Column the model is asked to predict
target = 'CO2 Emissions(g/km)'

# Predictor columns passed to the model
features = [
    'Engine Size(L)',
    'Cylinders',
    'Fuel Consumption City (L/100km)',
    'Fuel Consumption Hwy (L/100km)',
    'Fuel Consumption Comb (L/100km)',
]

# Hold out 20% of the rows for evaluation; the fixed seed keeps the split repeatable
train_data, test_data = train_test_split(data, test_size=0.2, random_state=42)

# Standardize the features: the scaler is fitted on the training rows only,
# then the same fitted scaler is applied to both splits
scaler = StandardScaler()
scaler.fit(train_data[features])
train_data_scaled = scaler.transform(train_data[features])
test_data_scaled = scaler.transform(test_data[features])

# Expand the scaled features with pairwise interaction terms
# (degree 2, interaction_only=True); fitted on the training split
poly = PolynomialFeatures(degree=2, interaction_only=True)
poly.fit(train_data_scaled)
train_data_poly = poly.transform(train_data_scaled)
test_data_poly = poly.transform(test_data_scaled)

# Build a Lasso regression and fit it on the transformed training data
# (fit() returns the estimator itself, so the chained form is equivalent)
lasso_model = Lasso(alpha=0.1, max_iter=10000).fit(train_data_poly, train_data[target])

# Predict the target for the transformed held-out rows
predictions_lasso = lasso_model.predict(test_data_poly)

# Root Mean Squared Error (RMSE): square root of the mean squared error
mse_lasso = mean_squared_error(test_data[target], predictions_lasso)
rmse_lasso = np.sqrt(mse_lasso)
print("RMSE (Lasso Regression):", rmse_lasso)

# Print the success message when RMSE is at most 15, otherwise the retry message
print(
    "Anda dapat berlangganan GPT-4!"
    if rmse_lasso <= 15
    else "Maaf, RMSE masih tinggi. Coba tuning model atau fitur lainnya."
)


RMSE (Lasso Regression): 35.18132063669722
Maaf, RMSE masih tinggi. Coba tuning model atau fitur lainnya.


In [3]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler, PolynomialFeatures
from sklearn.linear_model import ElasticNet
from sklearn.metrics import mean_squared_error
import numpy as np

# Read the cleaned training set from disk
data = pd.read_csv('cleaned_train.csv')

# Column the model is asked to predict
target = 'CO2 Emissions(g/km)'

# Predictor columns passed to the model
features = [
    'Engine Size(L)',
    'Cylinders',
    'Fuel Consumption City (L/100km)',
    'Fuel Consumption Hwy (L/100km)',
    'Fuel Consumption Comb (L/100km)',
]

# Hold out 20% of the rows for evaluation; the fixed seed keeps the split repeatable
train_data, test_data = train_test_split(data, test_size=0.2, random_state=42)

# Standardize the features: the scaler is fitted on the training rows only,
# then the same fitted scaler is applied to both splits
scaler = StandardScaler()
scaler.fit(train_data[features])
train_data_scaled = scaler.transform(train_data[features])
test_data_scaled = scaler.transform(test_data[features])

# Expand the scaled features with pairwise interaction terms
# (degree 2, interaction_only=True); fitted on the training split
poly = PolynomialFeatures(degree=2, interaction_only=True)
poly.fit(train_data_scaled)
train_data_poly = poly.transform(train_data_scaled)
test_data_poly = poly.transform(test_data_scaled)

# Build an ElasticNet regression and fit it on the transformed training data
# (fit() returns the estimator itself, so the chained form is equivalent)
elasticnet_model = ElasticNet(alpha=0.01, l1_ratio=0.5, max_iter=10000).fit(
    train_data_poly, train_data[target]
)

# Predict the target for the transformed held-out rows
predictions_elasticnet = elasticnet_model.predict(test_data_poly)

# Root Mean Squared Error (RMSE): square root of the mean squared error
mse_elasticnet = mean_squared_error(test_data[target], predictions_elasticnet)
rmse_elasticnet = np.sqrt(mse_elasticnet)
print("RMSE (ElasticNet Regression):", rmse_elasticnet)

# Print the success message when RMSE is at most 15, otherwise the retry message
print(
    "Anda dapat berlangganan GPT-4!"
    if rmse_elasticnet <= 15
    else "Maaf, RMSE masih tinggi. Coba tuning model atau fitur lainnya."
)


RMSE (ElasticNet Regression): 35.17909689697249
Maaf, RMSE masih tinggi. Coba tuning model atau fitur lainnya.


In [4]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestRegressor
from sklearn.metrics import mean_squared_error
import numpy as np

# Read the cleaned training set from disk
data = pd.read_csv('cleaned_train.csv')

# Column the model is asked to predict
target = 'CO2 Emissions(g/km)'

# Predictor columns passed to the model
features = [
    'Engine Size(L)',
    'Cylinders',
    'Fuel Consumption City (L/100km)',
    'Fuel Consumption Hwy (L/100km)',
    'Fuel Consumption Comb (L/100km)',
]

# Hold out 20% of the rows for evaluation; the fixed seed keeps the split repeatable
train_data, test_data = train_test_split(data, test_size=0.2, random_state=42)

# Build a 100-tree random forest with a fixed seed and fit it on the training rows
# (fit() returns the estimator itself, so the chained form is equivalent)
random_forest_model = RandomForestRegressor(n_estimators=100, random_state=42).fit(
    train_data[features], train_data[target]
)

# Predict the target for the held-out rows
predictions_random_forest = random_forest_model.predict(test_data[features])

# Root Mean Squared Error (RMSE): square root of the mean squared error
mse_random_forest = mean_squared_error(test_data[target], predictions_random_forest)
rmse_random_forest = np.sqrt(mse_random_forest)
print("RMSE (Random Forest Regression):", rmse_random_forest)

# Print the success message when RMSE is at most 15, otherwise the retry message
print(
    "Anda dapat berlangganan GPT-4!"
    if rmse_random_forest <= 15
    else "Maaf, RMSE masih tinggi. Coba tuning model atau fitur lainnya."
)


RMSE (Random Forest Regression): 30.05530477918409
Maaf, RMSE masih tinggi. Coba tuning model atau fitur lainnya.
