# Load CSV with Pandas

Load a CSV file and perform operations on it.

In our example we load a list of car metrics so that we can later predict the gasoline consumption of a car that is going to be built, based on some of its other metrics.

In [None]:
def mlg_to_l_per_100km(mpg):
    """Convert a fuel economy in miles per gallon to litres per 100 km.

    The gallon used here is 3.785411784 litres (the US liquid gallon) and
    the mile is 1.609344 km.

    Args:
        mpg: Fuel economy in miles per gallon. May be a plain number or any
            object supporting element-wise arithmetic, such as a pandas
            Series.

    Returns:
        The equivalent consumption in litres per 100 km, with the same
        shape as ``mpg``.
    """
    litres_per_gallon = 3.785411784
    km_per_mile = 1.609344

    # One gallon moves the car `mpg` miles, i.e. `km_per_mile * mpg` km;
    # scale the litres in that gallon up to a distance of 100 km.
    litres_scaled = 100 * litres_per_gallon
    km_per_gallon = km_per_mile * mpg
    return litres_scaled / km_per_gallon

In [None]:
# Quick sanity check of the converter: 100 mpg is roughly 2.35 L per 100 km
print(mlg_to_l_per_100km(mpg=100))

In [None]:
import pandas as pd

In [None]:
# Load the dataset from the CSV file into a DataFrame
df = pd.read_csv("./data/mpg-dataset.csv")

# Preview only the first rows; as the last expression of the cell the
# DataFrame gets the notebook's rich table rendering instead of a plain-text
# dump of the whole table.
df.head()

In [None]:
# Features (X): the cylinders, horsepower and weight columns of every car
X = df.loc[:, ["cylinders", "horsepower", "weight"]]
# Target (y): the "mpg" column converted to litres per 100 km
y = df["mpg"].pipe(mlg_to_l_per_100km)

In [None]:
import numpy as np
from sklearn.linear_model import LinearRegression

# Linear regression with an intercept term. fit() hands back the estimator
# itself, so the model is created and trained on (X, y) in one expression.
model = LinearRegression(fit_intercept=True).fit(X, y)

# Print the learned parameters, one per line:
#   1. the coefficients, i.e. the weight given to each input column of X
#   2. the intercept
print(model.coef_, model.intercept_, sep="\n")

In [None]:
# Predict the L per 100 km for our car
# with 8 cylinders, 200 horsepower and a weight of 2500.
# NOTE(review): the original comment gave the weight in kg - confirm the unit
# used by the "weight" column of the dataset.
#
# The model was fitted on a DataFrame, so the new sample is wrapped in a
# DataFrame carrying the same columns in the same order as X. Passing a bare
# list instead makes scikit-learn warn that the input has no valid feature
# names.
new_car = pd.DataFrame([[8, 200, 2500]], columns=X.columns)
print(model.predict(new_car))