In [1]:
# Section header, kept as a bare string literal so the cell echoes it.
# Topic: creating table styles. DataFrame.style returns a pandas Styler object
# offering methods to format and display a DataFrame. Two ways to build styles:
#   1. Styler.applymap - element-wise
#   2. Styler.apply    - column- / row- / table-wise
'''
表格样式创建
表格视觉样式：Dataframe.style → 返回pandas.Styler对象的属性，具有格式化和显示Dataframe的有用方法
样式创建：
① Styler.applymap：elementwise → 按元素方式处理Dataframe
② Styler.apply：column- / row- / table-wise → 按行/列处理Dataframe
 
'''

'\n表格样式创建\n表格视觉样式：Dataframe.style → 返回pandas.Styler对象的属性，具有格式化和显示Dataframe的有用方法\n样式创建：\n① Styler.applymap：elementwise → 按元素方式处理Dataframe\n② Styler.apply：column- / row- / table-wise → 按行/列处理Dataframe\n \n'

In [2]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
% matplotlib inline

# 样式

In [3]:
# Build a 10x4 DataFrame of random normal samples with columns a-d.
df = pd.DataFrame(np.random.randn(10,4),columns=['a','b','c','d'])
# DataFrame.style gives the Styler object for this frame.
sty = df.style
print(sty,type(sty))
# Inspect the Styler's repr and its type.
sty
# Leaving the Styler as the last expression displays the styled table.

<pandas.io.formats.style.Styler object at 0x00000232F28FA320> <class 'pandas.io.formats.style.Styler'>


Unnamed: 0,a,b,c,d
0,-1.2781,0.418737,0.225638,0.0740286
1,-2.5983,0.73293,-0.589586,-1.55728
2,0.668775,0.809012,-1.29073,0.964961
3,1.14403,-1.25876,0.154142,-0.667677
4,0.723197,1.07975,-0.893756,-0.980516
5,-1.10681,-0.684718,1.38121,0.0225004
6,1.13461,-2.24267,-0.148927,-0.33527
7,-0.3136,0.31674,-0.0961875,-0.528395
8,-1.61626,1.76631,-1.58776,0.964983
9,0.158542,1.87394,0.938945,0.452844


# 按元素处理样式：style.applymap()

In [4]:
def color_neg_red(val):
    """Return the CSS text-colour rule for a single cell value.

    Values strictly below zero yield 'color:red'; every other value
    (zero included) yields 'color:black'.
    """
    shade = 'red' if val < 0 else 'black'
    return 'color:' + shade
df.style.applymap(color_neg_red)
# Styling rule: numbers below zero are rendered in red.
# style.applymap() calls the supplied function for each element of the frame.
# NOTE(review): newer pandas releases rename this method to Styler.map and
# deprecate applymap - confirm against the installed pandas version.

Unnamed: 0,a,b,c,d
0,-1.2781,0.418737,0.225638,0.0740286
1,-2.5983,0.73293,-0.589586,-1.55728
2,0.668775,0.809012,-1.29073,0.964961
3,1.14403,-1.25876,0.154142,-0.667677
4,0.723197,1.07975,-0.893756,-0.980516
5,-1.10681,-0.684718,1.38121,0.0225004
6,1.13461,-2.24267,-0.148927,-0.33527
7,-0.3136,0.31674,-0.0961875,-0.528395
8,-1.61626,1.76631,-1.58776,0.964983
9,0.158542,1.87394,0.938945,0.452844


In [5]:
# 按行/列处理样式：style.apply()

def highlight_max(s):
    """Return one CSS rule per entry of ``s``, marking the maximum in yellow.

    Entries equal to ``s.max()`` get 'background-color: yellow'; all other
    entries get an empty string. The result is a plain list aligned with ``s``.
    """
    peak = s.max()
    return ['background-color: yellow' if hit else '' for hit in (s == peak)]
df.style.apply(highlight_max, axis = 0, subset = ['b','c'])
# Styling rule: fill the maximum of each column with yellow.
# axis: 0 applies the function per column, 1 per row; the default is 0.
# subset: limits styling to the selected labels (columns 'b' and 'c' here).

Unnamed: 0,a,b,c,d
0,-1.2781,0.418737,0.225638,0.0740286
1,-2.5983,0.73293,-0.589586,-1.55728
2,0.668775,0.809012,-1.29073,0.964961
3,1.14403,-1.25876,0.154142,-0.667677
4,0.723197,1.07975,-0.893756,-0.980516
5,-1.10681,-0.684718,1.38121,0.0225004
6,1.13461,-2.24267,-0.148927,-0.33527
7,-0.3136,0.31674,-0.0961875,-0.528395
8,-1.61626,1.76631,-1.58776,0.964983
9,0.158542,1.87394,0.938945,0.452844


In [6]:
# 样式索引、切片

# Apply highlight_max row by row (axis = 1), restricted to a row/column slice.
df.style.apply(highlight_max, axis = 1, 
               subset = pd.IndexSlice[2:5,['b', 'd']])
# pd.IndexSlice[] builds the row/column slice passed as subset.
# Original note: df[2:5].style.apply(highlight_max, subset = ['b', 'd']) also works
# (select the rows first, then style).
# NOTE(review): the two forms do not look equivalent - IndexSlice[2:5] is a label
# slice (row 5 presumably included), df[2:5] is positional (rows 2-4) and shows only
# those rows, and that call uses the default axis rather than axis = 1. Confirm.

Unnamed: 0,a,b,c,d
0,-1.2781,0.418737,0.225638,0.0740286
1,-2.5983,0.73293,-0.589586,-1.55728
2,0.668775,0.809012,-1.29073,0.964961
3,1.14403,-1.25876,0.154142,-0.667677
4,0.723197,1.07975,-0.893756,-0.980516
5,-1.10681,-0.684718,1.38121,0.0225004
6,1.13461,-2.24267,-0.148927,-0.33527
7,-0.3136,0.31674,-0.0961875,-0.528395
8,-1.61626,1.76631,-1.58776,0.964983
9,0.158542,1.87394,0.938945,0.452844


In [7]:
# Section header, kept as a bare string literal so the cell echoes it.
# Topic: controlling how table values are displayed with df.style.format().
'''
  表格显示控制

df.style.format()
 
'''

'\n  表格显示控制\n\ndf.style.format()\n \n'

In [8]:
# Display values as percentages

# Fresh 10x4 frame of random normal samples; replaces the earlier df.
df = pd.DataFrame(np.random.randn(10,4),columns=['a','b','c','d'])
# Plain-text view of the first rows, for comparison with the styled table below.
print(df.head())
# "{:.2%}" multiplies by 100 and renders two decimals followed by '%'.
df.head().style.format("{:.2%}")

          a         b         c         d
0 -0.954633  0.350287 -0.073404 -0.073680
1 -0.590143 -0.877179 -0.224328 -2.028683
2  1.766204  0.462374 -0.984897  0.711906
3  0.654040 -1.157215 -0.920077  0.696361
4 -0.200869 -1.466273 -0.336093  2.386551


Unnamed: 0,a,b,c,d
0,-95.46%,35.03%,-7.34%,-7.37%
1,-59.01%,-87.72%,-22.43%,-202.87%
2,176.62%,46.24%,-98.49%,71.19%
3,65.40%,-115.72%,-92.01%,69.64%
4,-20.09%,-146.63%,-33.61%,238.66%


In [9]:
# Control the number of decimal places ("{:.4f}" -> four decimals)

df.head().style.format("{:.4f}")

Unnamed: 0,a,b,c,d
0,-0.9546,0.3503,-0.0734,-0.0737
1,-0.5901,-0.8772,-0.2243,-2.0287
2,1.7662,0.4624,-0.9849,0.7119
3,0.654,-1.1572,-0.9201,0.6964
4,-0.2009,-1.4663,-0.3361,2.3866


In [10]:
# Show an explicit sign: the '+' flag prefixes positive numbers with '+'
# (negative numbers keep their '-'), here with two decimals.

df.head().style.format("{:+.2f}")

Unnamed: 0,a,b,c,d
0,-0.95,0.35,-0.07,-0.07
1,-0.59,-0.88,-0.22,-2.03
2,1.77,0.46,-0.98,0.71
3,0.65,-1.16,-0.92,0.7
4,-0.2,-1.47,-0.34,2.39


# 分列显示

In [11]:
# Per-column formatting: the dict maps a column label to its format string.
# Column 'a' is not listed and keeps the default rendering.
df.head().style.format({'b':"{:.2%}", 'c':"{:+.3f}", 'd':"{:.3f}"})

Unnamed: 0,a,b,c,d
0,-0.954633,35.03%,-0.073,-0.074
1,-0.590143,-87.72%,-0.224,-2.029
2,1.7662,46.24%,-0.985,0.712
3,0.65404,-115.72%,-0.92,0.696
4,-0.200869,-146.63%,-0.336,2.387


In [12]:
# Section header, kept as a bare string literal so the cell echoes it.
# Topic: using the styles built into Styler.
'''
  表格样式调用

Styler内置样式调用
 
'''

'\n  表格样式调用\n\nStyler内置样式调用\n \n'

In [13]:
# 定位空值

df = pd.DataFrame(np.random.rand(5,4),columns = list('ABCD'))
df['A'][2] = np.nan
df.style.highlight_null(null_color='red')

Unnamed: 0,A,B,C,D
0,0.408379,0.88785,0.437147,0.763856
1,0.109124,0.189091,0.591946,0.138708
2,,0.581038,0.905752,0.596347
3,0.817651,0.818862,0.448148,0.545672
4,0.73854,0.47869,0.302168,0.707387


# 色彩映射

In [14]:
# 10x4 frame of uniform random samples in [0, 1) with columns A-D.
df = pd.DataFrame(np.random.rand(10,4),columns = list('ABCD'))
df.style.background_gradient(cmap='Greens',axis =1,low=0,high=1)
# cmap: name of the colour map used for the gradient.
# axis: direction along which values are compared for colouring; 0 shades each
#       column on its own scale, 1 shades each row on its own scale (the same
#       convention as the axis argument of Styler.apply).

Unnamed: 0,A,B,C,D
0,0.524531,0.802931,0.793735,0.4317
1,0.618311,0.935626,0.0846534,0.102119
2,0.10835,0.116401,0.381709,0.7462
3,0.225649,0.0681239,0.0676053,0.904899
4,0.534463,0.393446,0.416612,0.499959
5,0.811279,0.915527,0.479173,0.407122
6,0.162478,0.839012,0.678219,0.0474624
7,0.787997,0.599783,0.245584,0.440729
8,0.81228,0.614313,0.314383,0.605323
9,0.35207,0.967864,0.847286,0.47223


# 条形图

In [15]:
# 10x4 frame of uniform random samples in [0, 1) with columns A-D.
df = pd.DataFrame(np.random.rand(10,4),columns = list('ABCD'))
# Draw in-cell bars for columns A and B only.
df.style.bar(subset=['A', 'B'], color='#d65f5f', width=100)
# width: percentage of the cell width occupied by the longest bar.

Unnamed: 0,A,B,C,D
0,0.669808,0.727277,0.88143,0.216082
1,0.172375,0.810108,0.708697,0.711163
2,0.14076,0.0161554,0.635799,0.462228
3,0.561844,0.696598,0.650747,0.584565
4,0.746448,0.297093,0.177114,0.302726
5,0.296277,0.915002,0.648372,0.219756
6,0.989522,0.0496722,0.145517,0.179054
7,0.333671,0.432445,0.765766,0.843753
8,0.107061,0.311644,0.572357,0.963915
9,0.135124,0.0481449,0.65535,0.582926


# 分段式构建样式

In [16]:
df = pd.DataFrame(np.random.rand(10,4),columns = list('ABCD'))
df['A'][[3,2]] = np.nan
df.style.\
    bar(subset=['A', 'B'], color='#d65f5f', width=100).\
    highlight_null(null_color='yellow')

Unnamed: 0,A,B,C,D
0,0.318426,0.527578,0.647486,0.514422
1,0.983468,0.244126,0.618971,0.442012
2,,0.721955,0.22589,0.98797
3,,0.720817,0.373376,0.577468
4,0.751617,0.0141835,0.506119,0.867578
5,0.681766,0.142734,0.694553,0.162425
6,0.724368,0.347562,0.429871,0.260745
7,0.600076,0.712234,0.989385,0.706441
8,0.615825,0.57037,0.00786836,0.449531
9,0.865457,0.719777,0.17478,0.540804
