In [1]:
%matplotlib notebook

In [2]:
# Dependencies
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

### Using MatplotLib to Chart a DataFrame

In [10]:
# Load in csv
rain_df = pd.read_csv("../Resources/avg_rain_state.csv")
rain_df.head()

Unnamed: 0,State,Inches,Milli­metres,Rank
0,Alabama,58.3,1480,4
1,Alaska,22.5,572,39
2,Arizona,13.6,345,47
3,Arkansas,50.6,1284,8
4,California,22.2,563,40


In [4]:
# Set x axis and tick locations
x_axis = np.arange(len(rain_df))
tick_locations = [value for value in x_axis]

In [6]:
# Create a list indicating where to write x labels and set figure size to adjust for space
plt.figure(figsize=(20,3))
plt.bar(x_axis, rain_df["Inches"], color='r', alpha=0.5, align="center")
plt.xticks(tick_locations, rain_df["State"], rotation="vertical")

<IPython.core.display.Javascript object>

([<matplotlib.axis.XTick at 0x1230aa278>,
  <matplotlib.axis.XTick at 0x1230adb00>,
  <matplotlib.axis.XTick at 0x1230ad860>,
  <matplotlib.axis.XTick at 0x12313a5c0>,
  <matplotlib.axis.XTick at 0x12313a940>,
  <matplotlib.axis.XTick at 0x12313ae10>,
  <matplotlib.axis.XTick at 0x123142320>,
  <matplotlib.axis.XTick at 0x1231427f0>,
  <matplotlib.axis.XTick at 0x123142cc0>,
  <matplotlib.axis.XTick at 0x12314b1d0>,
  <matplotlib.axis.XTick at 0x12314b6a0>,
  <matplotlib.axis.XTick at 0x12314bb70>,
  <matplotlib.axis.XTick at 0x1231520f0>,
  <matplotlib.axis.XTick at 0x12314b9e8>,
  <matplotlib.axis.XTick at 0x123142940>,
  <matplotlib.axis.XTick at 0x12313aa20>,
  <matplotlib.axis.XTick at 0x1231528d0>,
  <matplotlib.axis.XTick at 0x123152dd8>,
  <matplotlib.axis.XTick at 0x123159320>,
  <matplotlib.axis.XTick at 0x123159828>,
  <matplotlib.axis.XTick at 0x123159d30>,
  <matplotlib.axis.XTick at 0x123163278>,
  <matplotlib.axis.XTick at 0x123163780>,
  <matplotlib.axis.XTick at 0x1231

In [7]:
# Set x and y limits
plt.xlim(-0.75, len(x_axis))
plt.ylim(0, max(rain_df["Inches"])+10)

(0, 73.7)

In [8]:
# Set a Title and labels
plt.title("Average Rain per State")
plt.xlabel("State")
plt.ylabel("Average Amount of Rainfall in Inches")

Text(433.94444444444446, 0.5, 'Average Amount of Rainfall in Inches')

In [8]:
# Save our graph and show the grap
plt.tight_layout()
plt.savefig("../Images/avg_state_rain.png")
plt.show()

### Using Pandas to Chart a DataFrame

In [9]:
# Filter the DataFrame down only to those columns to chart
state_and_inches = rain_df[["State","Inches"]]

# Set the index to be "State" so they will be used as labels
state_and_inches = state_and_inches.set_index("State")

state_and_inches.head()

Unnamed: 0_level_0,Inches
State,Unnamed: 1_level_1
Alabama,58.3
Alaska,22.5
Arizona,13.6
Arkansas,50.6
California,22.2


In [10]:
# Use DataFrame.plot() in order to create a bar chart of the data
state_and_inches.plot(kind="bar", figsize=(20,3))

# Set a title for the chart
plt.title("Average Rain Per State")

plt.show()
plt.tight_layout()

<IPython.core.display.Javascript object>

In [11]:
# Pandas can also plot multiple columns if the DataFrame includes them
multi_plot = rain_df.plot(kind="bar", figsize=(20,5))

# PandasPlot.set_xticklabels() can be used to set the tick labels as well
multi_plot.set_xticklabels(rain_df["State"], rotation=45)

plt.show()
plt.tight_layout()

<IPython.core.display.Javascript object>