In [None]:
import numpy as np
import pandas as pd
from sklearn import preprocessing
from sklearn.model_selection import train_test_split
from sklearn.ensemble import GradientBoostingRegressor, RandomForestRegressor, ExtraTreesRegressor
from sklearn.ensemble import AdaBoostRegressor, GradientBoostingClassifier, RandomForestClassifier
from sklearn.ensemble import ExtraTreesClassifier, AdaBoostClassifier
import matplotlib.pyplot as plt
import seaborn as sns

In [None]:
# Load the forest-fire CSV, decoding it as latin1.
df = pd.read_csv('../input/forest-fires-in-brazil/amazon.csv', encoding='latin1')
# Drop the 'date' column. The axis is selected with the `columns=` keyword
# because pandas 2.0 removed the positional `axis` argument of DataFrame.drop.
df = df.drop(columns=['date'])

print(df.head())

In [None]:
# Replace the values of 'state' and 'month' with integer codes.
# A single encoder is refitted for each column in turn, so once the loop has
# finished `le` only holds the classes of the last column ('month').
le = preprocessing.LabelEncoder()
for column in ('state', 'month'):
    df[column] = le.fit_transform(df[column])

print(df.head())

In [None]:
# Pairwise scatter plots (with per-column distributions on the diagonal)
# for every column currently in df.
sns.pairplot(data=df)
plt.show()

In [None]:
# Sum the 'number' column per year with a vectorised groupby instead of a
# Python-level loop over iterrows().
yearly_totals = df.groupby('year')['number'].sum()

# Keep the names the following cells rely on:
#   year_map - {year: total}
#   years    - years in ascending order
#   totals   - totals aligned with `years`
year_map = yearly_totals.to_dict()
years = sorted(year_map)
totals = [year_map[year] for year in years]

# matplotlib 3.6 renamed the bundled seaborn styles to 'seaborn-v0_8-*' and
# later releases dropped the old names, so use whichever one is available.
whitegrid_style = 'seaborn-v0_8-whitegrid'
if whitegrid_style not in plt.style.available:
    whitegrid_style = 'seaborn-whitegrid'
plt.style.use(whitegrid_style)

plt.plot(years, totals)
plt.show()

In [None]:
# Linear fit of the yearly totals, without a confidence band.
# x and y are passed by keyword: seaborn 0.12 made them keyword-only, so the
# positional form raises a TypeError there. The keyword form also works on
# older releases.
sns.regplot(x=years, y=totals, ci=None)
plt.show()

In [None]:
# Third-order polynomial fit of the yearly totals, without a confidence band.
# x and y are passed by keyword: seaborn 0.12 made them keyword-only, so the
# positional form raises a TypeError there. The keyword form also works on
# older releases.
sns.regplot(x=years, y=totals, ci=None, order=3)
plt.show()

In [None]:
# Name of the column the regressors are trained to predict; every other
# column of df is used as a feature.
prediction_label = 'number'

In [None]:
# Feature matrix: every column except the target. The axis is selected with
# `columns=` because pandas 2.0 removed the positional `axis` argument of
# DataFrame.drop.
X = np.array(df.drop(columns=[prediction_label]))
# Target vector.
y = np.array(df[prediction_label])

In [None]:
  # Hold out 30% of the rows for evaluation; the fixed seed keeps the split
  # identical between runs.
  # NOTE(review): this cell carries a two-space leading indent. IPython
  # appears to tolerate it, but a plain Python script would not -- consider
  # dedenting the whole cell.
  X_train, X_test, y_train, y_test = train_test_split(
      X,
      y,
      test_size=0.3,
      random_state=42,
  )

In [None]:
# Seed the forest so that the fitted model, and therefore the reported score,
# is reproducible across runs (same seed as the train/test split).
estimator = RandomForestRegressor(n_estimators=100, random_state=42)
estimator.fit(X_train, y_train)
# For a regressor, score() returns the coefficient of determination (R^2) on
# the held-out data; it is not a classification accuracy despite the name.
accuracy = estimator.score(X_test, y_test)

print('Random Forest Regressor Accuracy: {}'.format(accuracy))

In [None]:
# Seed the ensemble so that the fitted model, and therefore the reported
# score, is reproducible across runs (same seed as the train/test split).
estimator = ExtraTreesRegressor(n_estimators=100, random_state=42)
estimator.fit(X_train, y_train)
# For a regressor, score() returns the coefficient of determination (R^2) on
# the held-out data; it is not a classification accuracy despite the name.
accuracy = estimator.score(X_test, y_test)

print('Extra Trees Regressor Accuracy: {}'.format(accuracy))

In [None]:
# Seed the booster so that the fitted model, and therefore the reported
# score, is reproducible across runs (same seed as the train/test split).
estimator = AdaBoostRegressor(n_estimators=100, random_state=42)
estimator.fit(X_train, y_train)
# For a regressor, score() returns the coefficient of determination (R^2) on
# the held-out data; it is not a classification accuracy despite the name.
accuracy = estimator.score(X_test, y_test)

print('Ada Boost Regressor Accuracy: {}'.format(accuracy))