In [1]:
%matplotlib notebook

In [2]:
# Dependencies
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

### Using MatplotLib to Chart a DataFrame

In [3]:
# Load in csv
rain_df = pd.read_csv("../Resources/avg_rain_state.csv")
rain_df.head()

Unnamed: 0,State,Inches,Milli­metres,Rank
0,Alabama,58.3,1480,4
1,Alaska,22.5,572,39
2,Arizona,13.6,345,47
3,Arkansas,50.6,1284,8
4,California,22.2,563,40


In [6]:
# Set x axis and tick locations
x_axis = np.arange(len(rain_df))
tick_locations = [value for value in x_axis]

In [7]:
# Create a list indicating where to write x labels and set figure size to adjust for space
plt.figure(figsize=(20,3))
plt.bar(x_axis, rain_df["Inches"], color='r', alpha=0.5, align="center")
plt.xticks(tick_locations, rain_df["State"], rotation="vertical")

<IPython.core.display.Javascript object>

([<matplotlib.axis.XTick at 0x18a3ee21e48>,
  <matplotlib.axis.XTick at 0x18a3f3e4748>,
  <matplotlib.axis.XTick at 0x18a3ee9c7c8>,
  <matplotlib.axis.XTick at 0x18a3ef433c8>,
  <matplotlib.axis.XTick at 0x18a3ef43b48>,
  <matplotlib.axis.XTick at 0x18a3ef49888>,
  <matplotlib.axis.XTick at 0x18a3ef4e748>,
  <matplotlib.axis.XTick at 0x18a3ef515c8>,
  <matplotlib.axis.XTick at 0x18a3ef55448>,
  <matplotlib.axis.XTick at 0x18a3ef5a2c8>,
  <matplotlib.axis.XTick at 0x18a3ef55548>,
  <matplotlib.axis.XTick at 0x18a3ef49148>,
  <matplotlib.axis.XTick at 0x18a3ef5fd88>,
  <matplotlib.axis.XTick at 0x18a3ef63ac8>,
  <matplotlib.axis.XTick at 0x18a3ef68808>,
  <matplotlib.axis.XTick at 0x18a3ef6c548>,
  <matplotlib.axis.XTick at 0x18a3ef6f348>,
  <matplotlib.axis.XTick at 0x18a3ef6cd08>,
  <matplotlib.axis.XTick at 0x18a3ef5f808>,
  <matplotlib.axis.XTick at 0x18a3ef74c88>,
  <matplotlib.axis.XTick at 0x18a3ef77a08>,
  <matplotlib.axis.XTick at 0x18a3ef7b788>,
  <matplotlib.axis.XTick at 0x18

In [9]:
# Set x and y limits
plt.xlim(-0.75, len(x_axis))
plt.ylim(0, max(rain_df["Inches"])+10)

(0.0, 73.7)

In [10]:
# Set a Title and labels
plt.title("Average Rain per State")
plt.xlabel("State")
plt.ylabel("Average Amount of Rainfall in Inches")

Text(325.45833333333337, 0.5, 'Average Amount of Rainfall in Inches')

In [11]:
# Save our graph and show the grap
plt.tight_layout()
plt.savefig("../Images/avg_state_rain.png")
plt.show()

### Using Pandas to Chart a DataFrame

In [12]:
# Filter the DataFrame down only to those columns to chart
state_and_inches = rain_df[["State","Inches"]]

# Set the index to be "State" so they will be used as labels
state_and_inches = state_and_inches.set_index("State")

state_and_inches.head()

Unnamed: 0_level_0,Inches
State,Unnamed: 1_level_1
Alabama,58.3
Alaska,22.5
Arizona,13.6
Arkansas,50.6
California,22.2


In [13]:
# Use DataFrame.plot() in order to create a bar chart of the data
state_and_inches.plot(kind="bar", figsize=(20,3))

# Set a title for the chart
plt.title("Average Rain Per State")

plt.show()
plt.tight_layout()

<IPython.core.display.Javascript object>

In [14]:
# Pandas can also plot multiple columns if the DataFrame includes them
multi_plot = rain_df.plot(kind="bar", figsize=(20,5))

# PandasPlot.set_xticklabels() can be used to set the tick labels as well
multi_plot.set_xticklabels(rain_df["State"], rotation=45)

plt.show()
plt.tight_layout()

<IPython.core.display.Javascript object>