# Pandas visualization

In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

%matplotlib notebook

In [2]:
# List the names of the style sheets this Matplotlib installation provides
plt.style.available

['Solarize_Light2',
 '_classic_test_patch',
 'bmh',
 'classic',
 'dark_background',
 'fast',
 'fivethirtyeight',
 'ggplot',
 'grayscale',
 'seaborn',
 'seaborn-bright',
 'seaborn-colorblind',
 'seaborn-dark',
 'seaborn-dark-palette',
 'seaborn-darkgrid',
 'seaborn-deep',
 'seaborn-muted',
 'seaborn-notebook',
 'seaborn-paper',
 'seaborn-pastel',
 'seaborn-poster',
 'seaborn-talk',
 'seaborn-ticks',
 'seaborn-white',
 'seaborn-whitegrid',
 'tableau-colorblind10']

In [3]:
# Matplotlib 3.6 renamed its bundled seaborn style sheets to 'seaborn-v0_8-*'
# and deprecated the old names, so newer releases may not accept
# 'seaborn-colorblind'. Use the new name when this installation lists it and
# fall back to the legacy name otherwise.
colorblind_style = (
    'seaborn-v0_8-colorblind'
    if 'seaborn-v0_8-colorblind' in plt.style.available
    else 'seaborn-colorblind'
)
plt.style.use(colorblind_style)

# DataFrame

In [4]:
# Fix the global NumPy seed so the three random walks are reproducible
np.random.seed(123)

# One observation per day, starting on 1 January 2017
n_days = 365
dates = pd.date_range('1/1/2017', periods=n_days)

# Draw the walks in column order (A, B, C) so the random stream is consumed
# in the same sequence on every run; B and C are shifted by +20 and -20.
walk_a = np.random.randn(n_days).cumsum(0)
walk_b = np.random.randn(n_days).cumsum(0) + 20
walk_c = np.random.randn(n_days).cumsum(0) - 20

df = pd.DataFrame({'A': walk_a, 'B': walk_b, 'C': walk_c}, index=dates)
df.head()

Unnamed: 0,A,B,C
2017-01-01,-1.085631,20.059291,-20.230904
2017-01-02,-0.088285,21.803332,-16.659325
2017-01-03,0.194693,20.835588,-17.055481
2017-01-04,-1.311601,21.255156,-17.093802
2017-01-05,-1.890202,21.462083,-19.518638


In [5]:
# Line chart of every column against the date index (the default plot kind)
df.plot.line()

<IPython.core.display.Javascript object>

<AxesSubplot:>

In [6]:
# Scatter plot of column B against column A
df.plot.scatter(x='A', y='B')

<IPython.core.display.Javascript object>

<AxesSubplot:xlabel='A', ylabel='B'>

In [10]:
# Scatter of C against A; column B drives both the marker colour (through the
# viridis colormap) and the marker size.
df.plot(kind='scatter', x='A', y='C', c='B', s=df['B'], colormap='viridis')

<IPython.core.display.Javascript object>

<AxesSubplot:xlabel='A', ylabel='C'>

In [11]:
# Keep the Axes returned by the scatter plot so it can be adjusted afterwards
ax = df.plot(kind='scatter', x='A', y='C', c='B', s=df['B'], colormap='viridis')
# Use the same scale on both axes
ax.set_aspect('equal')

<IPython.core.display.Javascript object>

In [12]:
# Box plot summarising the distribution of each column
df.plot(kind='box')

<IPython.core.display.Javascript object>

<AxesSubplot:>

In [13]:
# Overlaid histograms of all columns; partial transparency keeps overlaps visible
df.plot(kind='hist', alpha=0.7)

<IPython.core.display.Javascript object>

<AxesSubplot:ylabel='Frequency'>

In [14]:
# Kernel density estimate of each column (`density` is an alias of `kde`)
df.plot.density()

<IPython.core.display.Javascript object>

<AxesSubplot:ylabel='Density'>

### pandas.plotting

In [19]:
# Load the iris measurements from a CSV file in the working directory
iris = pd.read_csv('iris.csv')
# Preview the first rows of the loaded frame
iris.head()

Unnamed: 0,SepalLength,SepalWidth,PetalLength,PetalWidth,Name
0,5.1,3.5,1.4,0.2,Iris-setosa
1,4.9,3.0,1.4,0.2,Iris-setosa
2,4.7,3.2,1.3,0.2,Iris-setosa
3,4.6,3.1,1.5,0.2,Iris-setosa
4,5.0,3.6,1.4,0.2,Iris-setosa


In [21]:
# Draw a matrix of pairwise scatter plots for the iris measurements
pd.plotting.scatter_matrix(iris)

<IPython.core.display.Javascript object>

array([[<AxesSubplot:xlabel='SepalLength', ylabel='SepalLength'>,
        <AxesSubplot:xlabel='SepalWidth', ylabel='SepalLength'>,
        <AxesSubplot:xlabel='PetalLength', ylabel='SepalLength'>,
        <AxesSubplot:xlabel='PetalWidth', ylabel='SepalLength'>],
       [<AxesSubplot:xlabel='SepalLength', ylabel='SepalWidth'>,
        <AxesSubplot:xlabel='SepalWidth', ylabel='SepalWidth'>,
        <AxesSubplot:xlabel='PetalLength', ylabel='SepalWidth'>,
        <AxesSubplot:xlabel='PetalWidth', ylabel='SepalWidth'>],
       [<AxesSubplot:xlabel='SepalLength', ylabel='PetalLength'>,
        <AxesSubplot:xlabel='SepalWidth', ylabel='PetalLength'>,
        <AxesSubplot:xlabel='PetalLength', ylabel='PetalLength'>,
        <AxesSubplot:xlabel='PetalWidth', ylabel='PetalLength'>],
       [<AxesSubplot:xlabel='SepalLength', ylabel='PetalWidth'>,
        <AxesSubplot:xlabel='SepalWidth', ylabel='PetalWidth'>,
        <AxesSubplot:xlabel='PetalLength', ylabel='PetalWidth'>,
        <AxesSubplot:

In [22]:
# Start a new figure, then draw one line per row across the measurement
# columns, coloured by the value in the 'Name' column.
plt.figure()
pd.plotting.parallel_coordinates(frame=iris, class_column='Name')

<IPython.core.display.Javascript object>

<AxesSubplot:>

In [25]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

%matplotlib notebook

In [28]:
# Fix the global NumPy seed so both samples are reproducible
np.random.seed(1234)

n_samples = 1000

# v1: normal sample with mean 0 and standard deviation 10
v1 = pd.Series(np.random.normal(loc=0, scale=10, size=n_samples), name='v1')

# v2: twice v1 plus independent normal noise (mean 60, standard deviation 15).
# The noise is drawn after v1 so the random stream is consumed in the same order.
noise = np.random.normal(loc=60, scale=15, size=n_samples)
v2 = pd.Series(2 * v1 + noise, name='v2')

In [29]:
# Open a new figure for the histograms. The call parentheses are required:
# a bare `plt.figure` only references the function and creates nothing, so
# the bars would be drawn onto whichever figure happened to be current.
plt.figure()

# Share one set of bin edges so the two histograms are directly comparable
hist_bins = np.arange(-50, 150, 5)
plt.hist(v1, alpha=0.7, bins=hist_bins, label='v1')
plt.hist(v2, alpha=0.7, bins=hist_bins, label='v2')
plt.legend()

<IPython.core.display.Javascript object>

<matplotlib.legend.Legend at 0x2a519cc0640>

In [31]:
plt.figure()
# density=True normalises the stacked histogram so it shares the y-scale of
# the kernel density estimate drawn on top of it; with raw counts the KDE
# curve would be squashed flat against the x-axis.
plt.hist([v1, v2], histtype='barstacked', density=True)
# Pool both samples into one array and overlay its kernel density estimate
v3 = np.concatenate((v1, v2))
sns.kdeplot(v3)

<IPython.core.display.Javascript object>

<AxesSubplot:ylabel='Density'>

In [32]:
plt.figure()
# `sns.distplot` is deprecated, so build the same picture from its
# replacements: a density-normalised histogram in teal with the kernel
# density estimate overlaid in navy on the same (current) axes.
sns.histplot(v3, stat='density', color='Teal', alpha=0.4)
sns.kdeplot(v3, color='Navy')

<IPython.core.display.Javascript object>



<AxesSubplot:ylabel='Density'>

In [34]:
# Joint scatter plot of v2 against v1 with marginal distributions.
# The data vectors are passed as x=/y= keywords: seaborn deprecated
# positional data arguments in 0.11 and newer releases reject them.
sns.jointplot(x=v1, y=v2, alpha=0.4)



<IPython.core.display.Javascript object>

<seaborn.axisgrid.JointGrid at 0x2a51ae09670>

In [35]:
# Keep the returned JointGrid so the central axes can be adjusted.
# x=/y= keywords are used because seaborn deprecated positional data
# arguments in 0.11 and newer releases reject them.
grid = sns.jointplot(x=v1, y=v2, alpha=0.4)
# Use the same scale on both axes of the joint (central) plot
grid.ax_joint.set_aspect('equal')



<IPython.core.display.Javascript object>

In [36]:
# Hexagonal-bin version of the joint plot.
# x=/y= keywords are used because seaborn deprecated positional data
# arguments in 0.11 and newer releases reject them.
sns.jointplot(x=v1, y=v2, kind='hex')



<IPython.core.display.Javascript object>

<seaborn.axisgrid.JointGrid at 0x2a51d8ba130>

In [37]:
# Switch seaborn to its plain white style for the plots that follow
sns.set_style('white')

# Kernel-density version of the joint plot; space=0 removes the gap between
# the joint and marginal axes. x=/y= keywords are used because seaborn
# deprecated positional data arguments in 0.11 and newer releases reject them.
sns.jointplot(x=v1, y=v2, kind='kde', space=0)



<IPython.core.display.Javascript object>

<seaborn.axisgrid.JointGrid at 0x2a51df70370>

In [38]:
# Preview the first rows of the iris frame again before plotting it with seaborn
iris.head()

Unnamed: 0,SepalLength,SepalWidth,PetalLength,PetalWidth,Name
0,5.1,3.5,1.4,0.2,Iris-setosa
1,4.9,3.0,1.4,0.2,Iris-setosa
2,4.7,3.2,1.3,0.2,Iris-setosa
3,4.6,3.1,1.5,0.2,Iris-setosa
4,5.0,3.6,1.4,0.2,Iris-setosa


In [39]:
# Pairwise plots of the iris columns, coloured by the 'Name' column, with
# kernel density estimates on the diagonal
sns.pairplot(iris, hue='Name', diag_kind='kde')

<IPython.core.display.Javascript object>

<seaborn.axisgrid.PairGrid at 0x2a51e07b0d0>

In [41]:
# Two side-by-side panels comparing PetalLength across the values of 'Name'.
# The figure is 12 x 8 inches; the previous width of 128 inches was a typo
# that produced an unusably wide canvas.
plt.figure(figsize=(12, 8))

# Left panel: swarm plot (one marker per observation).
# x=/y= keywords are used because seaborn deprecated positional data
# arguments in 0.11 and newer releases reject them.
plt.subplot(121)
sns.swarmplot(x='Name', y='PetalLength', data=iris)

# Right panel: violin plot of the same variables
plt.subplot(122)
sns.violinplot(x='Name', y='PetalLength', data=iris)

<IPython.core.display.Javascript object>



<AxesSubplot:xlabel='Name', ylabel='PetalLength'>