## Pandas Visualization

In [22]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

%matplotlib notebook

In [4]:
# see the pre-defined styles provided.
plt.style.available

['seaborn-ticks',
 'seaborn-dark-palette',
 'seaborn-pastel',
 'seaborn-white',
 'grayscale',
 'seaborn-whitegrid',
 'seaborn',
 'seaborn-paper',
 'seaborn-talk',
 'seaborn-muted',
 'seaborn-poster',
 '_classic_test',
 'seaborn-notebook',
 'classic',
 'dark_background',
 'seaborn-darkgrid',
 'ggplot',
 'fivethirtyeight',
 'bmh',
 'seaborn-dark',
 'fast',
 'seaborn-deep',
 'seaborn-bright',
 'seaborn-colorblind',
 'Solarize_Light2']

In [3]:
# use the 'seaborn-colorblind' style
plt.style.use('seaborn-colorblind')

## DataFrame.plot

In [7]:
np.random.seed(123)

df = pd.DataFrame({'A': np.random.randn(365).cumsum(0), 
                   'B': np.random.randn(365).cumsum(0) + 20,
                   'C': np.random.randn(365).cumsum(0) - 20}, 
                  index=pd.date_range('1/1/2017', periods=365))
df.head()

Unnamed: 0,A,B,C
2017-01-01,-1.085631,20.059291,-20.230904
2017-01-02,-0.088285,21.803332,-16.659325
2017-01-03,0.194693,20.835588,-17.055481
2017-01-04,-1.311601,21.255156,-17.093802
2017-01-05,-1.890202,21.462083,-19.518638


In [8]:
df.plot()

<IPython.core.display.Javascript object>

<matplotlib.axes._subplots.AxesSubplot at 0x7f26fb92dfd0>

In [15]:
df.plot('A','B', kind = 'scatter');

<IPython.core.display.Javascript object>

In [16]:
# create a scatter plot of columns 'A' and 'C', with changing color (c) and size (s) based on column 'B'
df.plot.scatter('A', 'C', c='B', s=df['B'], colormap='viridis')

<IPython.core.display.Javascript object>

<matplotlib.axes._subplots.AxesSubplot at 0x7f26f33e9898>

In [17]:
ax = df.plot.scatter('A', 'C', c='B', s=df['B'], colormap='viridis')
ax.set_aspect('equal')

<IPython.core.display.Javascript object>

In [18]:
df.plot.box();

<IPython.core.display.Javascript object>

In [19]:
df.plot.hist(alpha=0.7);

<IPython.core.display.Javascript object>

In [20]:
df.plot.kde();

<IPython.core.display.Javascript object>

## pandas.tools.ploting

In [35]:
iris = pd.read_csv('iris.csv')
iris.head()

Unnamed: 0,5.1,0.222222222,3.5,0.625,1.4,0.06779661,0.2,0.041666667,setosa
0,4.9,0.166667,3.0,0.416667,1.4,0.067797,0.2,0.041667,setosa
1,4.7,0.111111,3.2,0.5,1.3,0.050847,0.2,0.041667,setosa
2,4.6,0.083333,3.1,0.458333,1.5,0.084746,0.2,0.041667,setosa
3,5.0,0.194444,3.6,0.666667,1.4,0.067797,0.2,0.041667,setosa
4,5.4,0.305556,3.9,0.791667,1.7,0.118644,0.4,0.125,setosa


## Seaborn

In [37]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

%matplotlib notebook

In [40]:
np.random.seed(1234)

v1 = pd.Series(np.random.normal(0,10,1000), name='v1')
v2 = pd.Series(2*v1 + np.random.normal(60,15,1000), name='v2')

In [42]:
plt.figure()
plt.hist(v1, alpha=0.7, bins=np.arange(-50,150,5), label='v1');
plt.hist(v2, alpha=0.7, bins=np.arange(-50,150,5), label='v2');
plt.legend();

<IPython.core.display.Javascript object>

In [43]:
plt.figure()
plt.hist(v1, alpha=0.7, bins=np.arange(-50,150,5), label='v1');
plt.hist(v2, alpha=0.7, bins=np.arange(-50,150,5), label='v2');
plt.legend();

<IPython.core.display.Javascript object>

In [46]:
# plot a kernel density estimation over a stacked barchart
plt.figure()
plt.hist([v1, v2], histtype='barstacked', normed=True);
v3 = np.concatenate((v1,v2))
sns.kdeplot(v3);

<IPython.core.display.Javascript object>

In [47]:
plt.figure()
# we can pass keyword arguments for each individual component of the plot
sns.distplot(v3, hist_kws={'color': 'Teal'}, kde_kws={'color': 'Navy'});

<IPython.core.display.Javascript object>

In [48]:
sns.jointplot(v1, v2, alpha=0.4);

<IPython.core.display.Javascript object>

In [49]:
grid = sns.jointplot(v1, v2, alpha=0.4);
grid.ax_joint.set_aspect('equal')

<IPython.core.display.Javascript object>

In [50]:
sns.jointplot(v1, v2, kind='hex');

<IPython.core.display.Javascript object>

In [51]:
# set the seaborn style for all the following plots
sns.set_style('white')

sns.jointplot(v1, v2, kind='kde', space=0);

<IPython.core.display.Javascript object>

In [58]:
iris = pd.read_csv('iris.csv')
iris.head()
sns.pairplot(iris, hue='Name', diag_kind='kde', size=2);

<IPython.core.display.Javascript object>

KeyError: 'Name'

In [59]:
plt.figure(figsize=(8,6))
plt.subplot(121)
sns.swarmplot('Name', 'PetalLength', data=iris);
plt.subplot(122)
sns.violinplot('Name', 'PetalLength', data=iris);

<IPython.core.display.Javascript object>

ValueError: Could not interpret input 'Name'