# Train a model to predict whether a person is a high-income earner based on their socioeconomic background

In [1]:
from fastai.tabular.all import *
# Uses the Adult dataset from the paper "Scaling Up the Accuracy of Naive-Bayes Classifiers".
# Fetch the sample archive, then describe the columns so the data loader can be built.
path = untar_data(URLs.ADULT_SAMPLE)

# Categorical columns: values drawn from a discrete set of choices (e.g. occupation).
categorical_columns = [
    'workclass',
    'education',
    'marital-status',
    'occupation',
    'relationship',
    'race',
]

# Continuous columns: values that represent a varying quantity (e.g. age).
continuous_columns = ['age', 'fnlwgt', 'education-num']

# Preprocessing steps handed to the data loader, in this order.
preprocessing_steps = [Categorify, FillMissing, Normalize]

# Build the DataLoaders from the CSV; "salary" is the column to predict.
dls = TabularDataLoaders.from_csv(
    path/'adult.csv',
    path=path,
    y_names="salary",
    cat_names=categorical_columns,
    cont_names=continuous_columns,
    procs=preprocessing_steps,
)



In [None]:
# Create the tabular learner from the DataLoaders built above, tracking accuracy as the metric.
learn = tabular_learner(dls, metrics=accuracy)

In [None]:
# No pretrained model is available for this task (in general, pretrained models are
# not widely available for tabular modeling tasks), so we call fit_one_cycle
# instead of fine_tune.
epochs = 3
learn.fit_one_cycle(epochs)

# Show a sample of the trained model's results.
learn.show_results()