###  Creating the Ml pipeline from ETL Data

In [2]:
# import libraries
import pandas as pd
from sqlalchemy import create_engine
import os

In [3]:
os.chdir("..")

In [4]:
# load data from database
engine = create_engine('sqlite:///data/disaster_response.db')
df = pd.read_sql('select * from messages1', engine)
df.head()

Unnamed: 0,id,message,original,genre,categories,related,request,offer,aid_related,medical_help,...,aid_centers,other_infrastructure,weather_related,floods,storm,fire,earthquake,cold,other_weather,direct_report
0,2,Weather update - a cold front from Cuba that c...,Un front froid se retrouve sur Cuba ce matin. ...,direct,related-1;request-0;offer-0;aid_related-0;medi...,1,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
1,7,Is the Hurricane over or is it not over,Cyclone nan fini osinon li pa fini,direct,related-1;request-0;offer-0;aid_related-1;medi...,1,0,0,1,0,...,0,0,1,0,1,0,0,0,0,0
2,8,Looking for someone but no name,"Patnm, di Maryani relem pou li banm nouvel li ...",direct,related-1;request-0;offer-0;aid_related-0;medi...,1,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
3,9,UN reports Leogane 80-90 destroyed. Only Hospi...,UN reports Leogane 80-90 destroyed. Only Hospi...,direct,related-1;request-1;offer-0;aid_related-1;medi...,1,1,0,1,0,...,0,0,0,0,0,0,0,0,0,0
4,12,"says: west side of Haiti, rest of the country ...",facade ouest d Haiti et le reste du pays aujou...,direct,related-1;request-0;offer-0;aid_related-0;medi...,1,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0


## Tokenizing the Data

In [5]:
import nltk
import re
nltk.download(['punkt', 'wordnet'])
from nltk.tokenize import word_tokenize
from nltk.stem import WordNetLemmatizer
def tokenize(text):
    text = re.sub(r'[^\w\s]','',text)
    tokens = word_tokenize(text)
    lemmatizer = WordNetLemmatizer()

    clean_tokens = []
    for tok in tokens:
        clean_tok = lemmatizer.lemmatize(tok).lower().strip()
        clean_tokens.append(clean_tok)

    return clean_tokens

[nltk_data] Downloading package punkt to /home/jetfire/nltk_data...
[nltk_data]   Package punkt is already up-to-date!
[nltk_data] Downloading package wordnet to /home/jetfire/nltk_data...
[nltk_data]   Package wordnet is already up-to-date!


In [6]:
df['tokens'] = df.message.apply(lambda x:tokenize(x))

In [7]:
## Making Independent Values and dependent Values
X = df['message']
y = df.iloc[:, 5:39]

In [8]:
y.columns.tolist()

['related',
 'request',
 'offer',
 'aid_related',
 'medical_help',
 'medical_products',
 'search_and_rescue',
 'security',
 'military',
 'child_alone',
 'water',
 'food',
 'shelter',
 'clothing',
 'money',
 'missing_people',
 'refugees',
 'death',
 'other_aid',
 'infrastructure_related',
 'transport',
 'buildings',
 'electricity',
 'tools',
 'hospitals',
 'shops',
 'aid_centers',
 'other_infrastructure',
 'weather_related',
 'floods',
 'storm',
 'fire',
 'earthquake',
 'cold']

In [9]:
y['related'].replace(2, 1, inplace=True)

In [10]:
y['related'].unique()

array([1, 0])

In [11]:
y

Unnamed: 0,related,request,offer,aid_related,medical_help,medical_products,search_and_rescue,security,military,child_alone,...,hospitals,shops,aid_centers,other_infrastructure,weather_related,floods,storm,fire,earthquake,cold
0,1,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
1,1,0,0,1,0,0,0,0,0,0,...,0,0,0,0,1,0,1,0,0,0
2,1,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
3,1,1,0,1,0,1,0,0,0,0,...,1,0,0,0,0,0,0,0,0,0
4,1,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
26211,0,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
26212,0,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
26213,1,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
26214,1,0,0,1,0,0,0,0,1,0,...,0,0,0,0,0,0,0,0,0,0


In [12]:
from sklearn.pipeline import Pipeline
from sklearn.ensemble import RandomForestClassifier
from sklearn.feature_extraction.text import CountVectorizer, TfidfTransformer
from sklearn.multioutput import MultiOutputClassifier

In [13]:
pipeline = Pipeline([
        ('vect', CountVectorizer(tokenizer=tokenize)),
        ('tfidf', TfidfTransformer()),
        ('clf', MultiOutputClassifier(RandomForestClassifier()))
    ])

In [14]:
from sklearn.model_selection import train_test_split
X_train, X_test, y_train, y_test = train_test_split(X, y)
pipeline.fit(X_train, y_train)

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

Pipeline(memory=None,
         steps=[('vect',
                 CountVectorizer(analyzer='word', binary=False,
                                 decode_error='strict',
                                 dtype=<class 'numpy.int64'>, encoding='utf-8',
                                 input='content', lowercase=True, max_df=1.0,
                                 max_features=None, min_df=1,
                                 ngram_range=(1, 1), preprocessor=None,
                                 stop_words=None, strip_accents=None,
                                 token_pattern='(?u)\\b\\w\\w+\\b',
                                 tokenizer=<function tokenize at...
                 MultiOutputClassifier(estimator=RandomForestClassifier(bootstrap=True,
                                                                        class_weight=None,
                                                                        criterion='gini',
                                                                  

In [32]:
y_pred = pipeline.predict(X_test)

In [33]:
y_pred_df = pd.DataFrame(y_pred, columns=y_test.columns)

In [20]:
from sklearn.metrics import classification_report

In [35]:
print(classification_report(y_test, y_pred, target_names=y.columns.tolist()))

                        precision    recall  f1-score   support

               related       0.83      0.93      0.88      5042
               request       0.84      0.37      0.52      1125
                 offer       0.00      0.00      0.00        28
           aid_related       0.75      0.53      0.62      2732
          medical_help       0.58      0.09      0.16       512
      medical_products       0.64      0.12      0.20       308
     search_and_rescue       0.60      0.02      0.03       181
              security       0.50      0.01      0.02       114
              military       0.58      0.06      0.12       216
           child_alone       0.00      0.00      0.00         0
                 water       0.84      0.16      0.27       448
                  food       0.81      0.34      0.48       761
               shelter       0.76      0.19      0.30       580
              clothing       0.60      0.09      0.16       101
                 money       0.14      

  precision = _prf_divide(tp_sum, pred_sum,
  recall = _prf_divide(tp_sum, true_sum,
  precision = _prf_divide(tp_sum, pred_sum,
  recall = _prf_divide(tp_sum, true_sum,


In [38]:
for i in range(34):
    print("Precision, Recall, F1 Score for {}".format(y_test.columns[i]))
    print(classification_report(y_test.iloc[:,i], y_pred[:,i]))

Precision, Recall, F1 Score for related
              precision    recall  f1-score   support

           0       0.60      0.36      0.45      1512
           1       0.83      0.93      0.88      5042

    accuracy                           0.80      6554
   macro avg       0.72      0.64      0.66      6554
weighted avg       0.78      0.80      0.78      6554

Precision, Recall, F1 Score for request
              precision    recall  f1-score   support

           0       0.88      0.98      0.93      5429
           1       0.84      0.37      0.52      1125

    accuracy                           0.88      6554
   macro avg       0.86      0.68      0.72      6554
weighted avg       0.88      0.88      0.86      6554

Precision, Recall, F1 Score for offer
              precision    recall  f1-score   support

           0       1.00      1.00      1.00      6526
           1       0.00      0.00      0.00        28

    accuracy                           1.00      6554
   macro a

In [39]:
from sklearn.model_selection import GridSearchCV
parameters = {
        'vect__ngram_range': ((1, 1), (1, 2)),
        'vect__max_df': (0.5, 0.75, 1.0),
        'tfidf__use_idf': (True, False)
    }

cv = GridSearchCV(pipeline, param_grid=parameters)

In [40]:
cv.fit(X_train, y_train)
y_pred = cv.predict(X_test)

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default value of n_estimators will change from "
  warn("The default valu

  warn("The default value of n_estimators will change from "


In [41]:
print(classification_report(y_test, y_pred, target_names=y.columns.tolist()))

                        precision    recall  f1-score   support

               related       0.82      0.94      0.88      5042
               request       0.86      0.39      0.54      1125
                 offer       0.00      0.00      0.00        28
           aid_related       0.77      0.47      0.58      2732
          medical_help       0.62      0.07      0.12       512
      medical_products       0.73      0.14      0.23       308
     search_and_rescue       0.75      0.07      0.12       181
              security       0.50      0.02      0.03       114
              military       0.63      0.06      0.10       216
           child_alone       0.00      0.00      0.00         0
                 water       0.88      0.24      0.38       448
                  food       0.85      0.46      0.60       761
               shelter       0.81      0.19      0.31       580
              clothing       0.67      0.04      0.07       101
                 money       0.88      

  precision = _prf_divide(tp_sum, pred_sum,
  recall = _prf_divide(tp_sum, true_sum,
  precision = _prf_divide(tp_sum, pred_sum,
  recall = _prf_divide(tp_sum, true_sum,


In [16]:
import xgboost as xgb

In [17]:
pipeline = Pipeline([
        ('vect', CountVectorizer(tokenizer=tokenize)),
        ('tfidf', TfidfTransformer()),
        ('clf', MultiOutputClassifier(xgb.XGBClassifier()))
    ])

In [18]:
pipeline.fit(X_train, y_train)
y_pred = pipeline.predict(X_test)







In [21]:
print(classification_report(y_test, y_pred, target_names=y.columns.tolist()))

                        precision    recall  f1-score   support

               related       0.84      0.94      0.89      5027
               request       0.78      0.58      0.66      1099
                 offer       0.00      0.00      0.00        27
           aid_related       0.78      0.67      0.72      2702
          medical_help       0.61      0.26      0.36       516
      medical_products       0.64      0.30      0.41       331
     search_and_rescue       0.64      0.15      0.24       186
              security       0.60      0.02      0.04       135
              military       0.60      0.32      0.41       203
           child_alone       0.00      0.00      0.00         0
                 water       0.82      0.66      0.73       422
                  food       0.82      0.75      0.78       741
               shelter       0.77      0.56      0.65       579
              clothing       0.70      0.53      0.60        91
                 money       0.60      

  precision = _prf_divide(tp_sum, pred_sum,
  recall = _prf_divide(tp_sum, true_sum,
  precision = _prf_divide(tp_sum, pred_sum,
  recall = _prf_divide(tp_sum, true_sum,


#### Compared to RF model with gridsearch XGBoost preformed better will be using for deployment 

####  Saving the model

In [22]:
import pickle
filename = 'XGB_Model.pkl'
pickle.dump(pipeline, open(filename, 'wb'))