In [1]:
import numpy as np
import pandas as pd
from matplotlib import pyplot as plt
from numpy import nan as NA
import seaborn as sns 
import jieba 

plt.rcParams['font.sans-serif'] = ['SimHei'] # use the SimHei font so Chinese labels render in plots
plt.rcParams['axes.unicode_minus'] = False # render the minus sign correctly on axes
import openpyxl as xl
# Optional: echo the value of every top-level expression in a cell, not only the last one
from IPython.core.interactiveshell import InteractiveShell
InteractiveShell.ast_node_interactivity = "all"


## 1.数据清洗

In [2]:
# Load the raw Double-11 Taobao cosmetics CSV (UTF-8, first row is the header) and preview it
data = pd.read_csv("./双十一淘宝美妆数据.csv",encoding = "utf-8",header = 0)
data.head(20)

Unnamed: 0,update_time,id,title,price,sale_count,comment_count,店名
0,2016/11/14,A18164178225,CHANDO/自然堂 雪域精粹纯粹滋润霜50g 补水保湿 滋润水润面霜,139.0,26719.0,2704.0,自然堂
1,2016/11/14,A18177105952,CHANDO/自然堂凝时鲜颜肌活乳液120ML 淡化细纹补水滋润专柜正品,194.0,8122.0,1492.0,自然堂
2,2016/11/14,A18177226992,CHANDO/自然堂活泉保湿修护精华水（滋润型135ml 补水控油爽肤水,99.0,12668.0,589.0,自然堂
3,2016/11/14,A18178033846,CHANDO/自然堂 男士劲爽控油洁面膏 100g 深层清洁 男士洗面奶,38.0,25805.0,4287.0,自然堂
4,2016/11/14,A18178045259,CHANDO/自然堂雪域精粹纯粹滋润霜（清爽型）50g补水保湿滋润霜,139.0,5196.0,618.0,自然堂
5,2016/11/14,A18178129035,自然堂 雪域纯粹滋润洗颜霜 110g 补水保湿 洗面奶女 深层清洁,88.0,42858.0,8426.0,自然堂
6,2016/11/14,A18178206572,CHANDO/自然堂雪润皙白晶采霜（滋润型）50g 滋润修护面霜 正品,139.0,3027.0,304.0,自然堂
7,2016/11/14,A18190290933,自然堂 活泉深层净化控油凝露60g 控油补水保湿滋润 活泉精华正品,86.0,6925.0,740.0,自然堂
8,2016/11/14,A18250630014,CHANDO/自然堂 凝时鲜颜肌活修护精华液35ml 淡化细纹护肤精华,216.0,4649.0,630.0,自然堂
9,2016/11/14,A18422797881,CHANDO/自然堂活泉保湿精华套装 保湿补水滋润控油面部护理套装,258.0,2293.0,43.0,自然堂


In [3]:
# Inspect the dimensions of the data as (rows, columns)
data.shape

(27598, 7)

In [4]:
# Common descriptive statistics (count, mean, std, quartiles, min/max) for the numeric columns
data.describe()

Unnamed: 0,price,sale_count,comment_count
count,27598.0,25244.0,25244.0
mean,362.8306,12301.77,1121.141816
std,614.17332,52336.93,5271.059822
min,1.0,0.0,0.0
25%,99.0,279.0,21.0
50%,205.0,1445.0,153.0
75%,390.0,6354.5,669.0
max,11100.0,1923160.0,202930.0


In [5]:
# Inspect the columns: names, non-null counts and dtypes
data.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 27598 entries, 0 to 27597
Data columns (total 7 columns):
 #   Column         Non-Null Count  Dtype  
---  ------         --------------  -----  
 0   update_time    27598 non-null  object 
 1   id             27598 non-null  object 
 2   title          27598 non-null  object 
 3   price          27598 non-null  float64
 4   sale_count     25244 non-null  float64
 5   comment_count  25244 non-null  float64
 6   店名             27598 non-null  object 
dtypes: float64(3), object(4)
memory usage: 1.5+ MB


In [6]:
# Convert update_time from string (object dtype) to datetime64, then re-check the dtypes
data["update_time"] = pd.to_datetime(data["update_time"] )
data.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 27598 entries, 0 to 27597
Data columns (total 7 columns):
 #   Column         Non-Null Count  Dtype         
---  ------         --------------  -----         
 0   update_time    27598 non-null  datetime64[ns]
 1   id             27598 non-null  object        
 2   title          27598 non-null  object        
 3   price          27598 non-null  float64       
 4   sale_count     25244 non-null  float64       
 5   comment_count  25244 non-null  float64       
 6   店名             27598 non-null  object        
dtypes: datetime64[ns](1), float64(3), object(3)
memory usage: 1.5+ MB


In [7]:
# Show the rows whose sale_count is missing
data.loc[data["sale_count"].isna()]

Unnamed: 0,update_time,id,title,price,sale_count,comment_count,店名
2011,2016-11-14,A527960599636,Shu uemura植村秀新无色限唇膏 口红 长效保湿滋润 显色持久 正品,215.0,,,植村秀
2012,2016-11-14,A528013549083,Shu uemura植村秀晶萃溢彩肌底液30ml 面部精华,590.0,,,植村秀
2013,2016-11-14,A528030330786,Shu uemura 植村秀无色限柔雾唇膏 哑光口红 保湿持久 高饱和显色,215.0,,,植村秀
2014,2016-11-14,A528091449317,shu uemura植村秀无色限唇颊缤纷霜 腮红 口红两用 唇彩 正品,220.0,,,植村秀
2015,2016-11-14,A528191935022,Shu uemura植村秀韵眉膏 染眉膏 多维度丰眉刷头,280.0,,,植村秀
...,...,...,...,...,...,...,...
27593,2016-11-05,A535642405757,SK-II【11-11】全新大眼眼霜skii放大双眼眼部修护精华紧致,590.0,,,SKII
27594,2016-11-05,A535911851408,SK-II 11-11预售skii大眼眼霜sk2眼部修护精华霜淡化黑眼圈,590.0,,,SKII
27595,2016-11-05,A537027211850,SK-II 11-11预售skii前男友护肤面膜sk2精华面膜贴密集修护,1740.0,,,SKII
27596,2016-11-05,A538212160126,SK-II 11-11预售skiisk2神仙水护肤精华油面部套装滋润补水密集修,1190.0,,,SKII


In [8]:
# Show the rows whose comment_count is missing
data.loc[data["comment_count"].isna()]

Unnamed: 0,update_time,id,title,price,sale_count,comment_count,店名
2011,2016-11-14,A527960599636,Shu uemura植村秀新无色限唇膏 口红 长效保湿滋润 显色持久 正品,215.0,,,植村秀
2012,2016-11-14,A528013549083,Shu uemura植村秀晶萃溢彩肌底液30ml 面部精华,590.0,,,植村秀
2013,2016-11-14,A528030330786,Shu uemura 植村秀无色限柔雾唇膏 哑光口红 保湿持久 高饱和显色,215.0,,,植村秀
2014,2016-11-14,A528091449317,shu uemura植村秀无色限唇颊缤纷霜 腮红 口红两用 唇彩 正品,220.0,,,植村秀
2015,2016-11-14,A528191935022,Shu uemura植村秀韵眉膏 染眉膏 多维度丰眉刷头,280.0,,,植村秀
...,...,...,...,...,...,...,...
27593,2016-11-05,A535642405757,SK-II【11-11】全新大眼眼霜skii放大双眼眼部修护精华紧致,590.0,,,SKII
27594,2016-11-05,A535911851408,SK-II 11-11预售skii大眼眼霜sk2眼部修护精华霜淡化黑眼圈,590.0,,,SKII
27595,2016-11-05,A537027211850,SK-II 11-11预售skii前男友护肤面膜sk2精华面膜贴密集修护,1740.0,,,SKII
27596,2016-11-05,A538212160126,SK-II 11-11预售skiisk2神仙水护肤精华油面部套装滋润补水密集修,1190.0,,,SKII


In [9]:
# Show every fully duplicated row; keep=False flags all copies, not only the repeats
data.loc[data.duplicated(keep=False)]

Unnamed: 0,update_time,id,title,price,sale_count,comment_count,店名
820,2016-11-07,A18177226992,CHANDO/自然堂活泉保湿修护精华水（滋润型135ml 补水控油爽肤水,99.0,6398.0,583.0,自然堂
821,2016-11-07,A18177226992,CHANDO/自然堂活泉保湿修护精华水（滋润型135ml 补水控油爽肤水,99.0,6398.0,583.0,自然堂
822,2016-11-07,A18177318911,自然堂 活泉补水洁面乳 125g 深层清洁滋润 正品包邮洗面奶女男,69.0,44112.0,7420.0,自然堂
823,2016-11-07,A18177318911,自然堂 活泉补水洁面乳 125g 深层清洁滋润 正品包邮洗面奶女男,69.0,44112.0,7420.0,自然堂
831,2016-11-07,A19009618209,CHANDO/自然堂凝时鲜颜套装水乳/霜套装 补水保湿滋润淡化细纹,348.0,14015.0,1782.0,自然堂
...,...,...,...,...,...,...,...
22019,2016-11-07,A38053046999,兰芝自然舒润防晒霜50ml SPF30/PA++ 清爽保湿全身女夏 官方直售,195.0,3205.0,91.0,兰芝
22086,2016-11-07,A540000709042,【11.11专享】兰芝多效净肤洁颜膏180ml 洗面奶深层清洁毛孔 补,205.0,13.0,0.0,兰芝
22087,2016-11-07,A540000709042,【11.11专享】兰芝多效净肤洁颜膏180ml 洗面奶深层清洁毛孔 补,205.0,13.0,0.0,兰芝
25791,2016-11-10,A528101929150,佰草集 新清透修护防晒液SPF30+ PA+++,180.0,3742.0,970.0,佰草集


In [10]:
# Remove fully duplicated rows, keeping the first occurrence of each
data = data.drop_duplicates()

In [11]:
# Confirm the duplicates are gone: this selection is expected to be empty
data.loc[data.duplicated(keep=False)]

Unnamed: 0,update_time,id,title,price,sale_count,comment_count,店名


In [12]:
# Count the missing values in each column
data.isna().sum()

update_time         0
id                  0
title               0
price               0
sale_count       2350
comment_count    2350
店名                  0
dtype: int64

In [13]:
# Drop every row that still contains a missing value, then re-check the schema
data = data.dropna()
data.info()

<class 'pandas.core.frame.DataFrame'>
Index: 25162 entries, 0 to 27128
Data columns (total 7 columns):
 #   Column         Non-Null Count  Dtype         
---  ------         --------------  -----         
 0   update_time    25162 non-null  datetime64[ns]
 1   id             25162 non-null  object        
 2   title          25162 non-null  object        
 3   price          25162 non-null  float64       
 4   sale_count     25162 non-null  float64       
 5   comment_count  25162 non-null  float64       
 6   店名             25162 non-null  object        
dtypes: datetime64[ns](1), float64(3), object(3)
memory usage: 1.5+ MB


In [14]:
# Rename the Chinese shop-name column '店名' to 'brand'
data = data.rename(columns={'店名': 'brand'})
data

Unnamed: 0,update_time,id,title,price,sale_count,comment_count,brand
0,2016-11-14,A18164178225,CHANDO/自然堂 雪域精粹纯粹滋润霜50g 补水保湿 滋润水润面霜,139.0,26719.0,2704.0,自然堂
1,2016-11-14,A18177105952,CHANDO/自然堂凝时鲜颜肌活乳液120ML 淡化细纹补水滋润专柜正品,194.0,8122.0,1492.0,自然堂
2,2016-11-14,A18177226992,CHANDO/自然堂活泉保湿修护精华水（滋润型135ml 补水控油爽肤水,99.0,12668.0,589.0,自然堂
3,2016-11-14,A18178033846,CHANDO/自然堂 男士劲爽控油洁面膏 100g 深层清洁 男士洗面奶,38.0,25805.0,4287.0,自然堂
4,2016-11-14,A18178045259,CHANDO/自然堂雪域精粹纯粹滋润霜（清爽型）50g补水保湿滋润霜,139.0,5196.0,618.0,自然堂
...,...,...,...,...,...,...,...
27124,2016-11-05,A539946580915,佰草集惊艳时光十八周年典萃限量礼盒护肤套装 预售有礼,380.0,722.0,0.0,佰草集
27125,2016-11-05,A539973230837,佰草集平衡洁面乳洗面奶100g*2支保湿补水控油 赠旅行套 预售有礼,96.0,3520.0,0.0,佰草集
27126,2016-11-05,A540021300133,Herborist/佰草集新七白美白嫩肤面膜260g 补水保湿嫩肤,420.0,10738.0,5494.0,佰草集
27127,2016-11-05,A540084337255,Herborist/佰草集新美肌梦幻曲面膜组23片装,580.0,0.0,0.0,佰草集


## 2.商品标题分词

### 2.1商品标题分词

In [15]:
# Tokenise every product title with jieba; item_name_cut holds the list of tokens per row
data['item_name_cut'] = data['title'].apply(jieba.lcut)

Building prefix dict from the default dictionary ...
Loading model from cache C:\Users\ADMINI~1\AppData\Local\Temp\jieba.cache
Loading model cost 0.748 seconds.
Prefix dict has been built successfully.


In [16]:
# Preview the tokenised titles
data[['item_name_cut']].head()

Unnamed: 0,item_name_cut
0,"[CHANDO, /, 自然, 堂, , 雪域, 精粹, 纯粹, 滋润霜, 50g, ,..."
1,"[CHANDO, /, 自然, 堂, 凝, 时鲜, 颜肌活, 乳液, 120ML, , 淡..."
2,"[CHANDO, /, 自然, 堂, 活泉, 保湿, 修护, 精华, 水, （, 滋润, 型..."
3,"[CHANDO, /, 自然, 堂, , 男士, 劲爽, 控油, 洁面膏, , 100g..."
4,"[CHANDO, /, 自然, 堂, 雪域, 精粹, 纯粹, 滋润霜, （, 清爽型, ）,..."


### 2.2构建商品类目（添加主类别、次类别）

In [17]:
# Category configuration, one category per line:
#   <main type> <sub type> <keyword> <keyword> ...
# Fields are separated by tabs (pasted from a spreadsheet, hence the trailing tabs).
basic_config_data = """护肤品	套装	套装							
护肤品	乳液类	乳液	美白乳	润肤乳	凝乳	柔肤液	亮肤乳	菁华乳	修护乳
护肤品	眼部护理	眼霜	眼部精华	眼膜					
护肤品	面膜类	面膜													
护肤品	清洁类	洗面	洁面	清洁	卸妆	洁颜	洗颜	去角质	磨砂						
护肤品	化妆水	化妆水	爽肤水	柔肤水	补水露	凝露	柔肤液	精粹水	亮肤水	润肤水	保湿水	菁华水	保湿喷雾	舒缓喷雾
护肤品	面霜类	面霜	日霜	晚霜	柔肤霜	滋润霜	保湿霜	凝霜	日间霜	晚间霜	乳霜	修护霜	亮肤霜	底霜	菁华霜
护肤品	精华类	精华液	精华水	精华露	精华素										
护肤品	防晒类	防晒霜	防晒喷雾												
化妆品	口红类	唇釉	口红	唇彩											
化妆品	底妆类	散粉	蜜粉	粉底液	定妆粉 	气垫	粉饼	BB	CC	遮瑕	粉霜	粉底膏	粉底霜		
化妆品	眼部彩妆	眉粉	染眉膏	眼线	眼影	睫毛膏									
化妆品	修容类	鼻影	修容粉	高光	腮红										
其他	其他	其他"""

# Maps keyword -> (main type, sub type).
category_config_map = {}

for config_line in basic_config_data.splitlines():
    # split() with no argument splits on any run of whitespace and drops empty
    # fields, so trailing tabs and stray spaces around a keyword (e.g. after
    # '定妆粉') cannot leak into the keys and make them unmatchable.
    fields = config_line.split()
    category_pair = tuple(fields[:2])
    for keyword in fields[2:]:
        # A keyword listed under two categories keeps the later one:
        # '柔肤液' appears under both 乳液类 and 化妆水 and resolves to 化妆水.
        category_config_map[keyword] = category_pair

category_config_map

{'套装': ('护肤品', '套装'),
 '乳液': ('护肤品', '乳液类'),
 '美白乳': ('护肤品', '乳液类'),
 '润肤乳': ('护肤品', '乳液类'),
 '凝乳': ('护肤品', '乳液类'),
 '柔肤液': ('护肤品', '化妆水'),
 '亮肤乳': ('护肤品', '乳液类'),
 '菁华乳': ('护肤品', '乳液类'),
 '修护乳': ('护肤品', '乳液类'),
 '眼霜': ('护肤品', '眼部护理'),
 '眼部精华': ('护肤品', '眼部护理'),
 '眼膜': ('护肤品', '眼部护理'),
 '面膜': ('护肤品', '面膜类'),
 '洗面': ('护肤品', '清洁类'),
 '洁面': ('护肤品', '清洁类'),
 '清洁': ('护肤品', '清洁类'),
 '卸妆': ('护肤品', '清洁类'),
 '洁颜': ('护肤品', '清洁类'),
 '洗颜': ('护肤品', '清洁类'),
 '去角质': ('护肤品', '清洁类'),
 '磨砂': ('护肤品', '清洁类'),
 '化妆水': ('护肤品', '化妆水'),
 '爽肤水': ('护肤品', '化妆水'),
 '柔肤水': ('护肤品', '化妆水'),
 '补水露': ('护肤品', '化妆水'),
 '凝露': ('护肤品', '化妆水'),
 '精粹水': ('护肤品', '化妆水'),
 '亮肤水': ('护肤品', '化妆水'),
 '润肤水': ('护肤品', '化妆水'),
 '保湿水': ('护肤品', '化妆水'),
 '菁华水': ('护肤品', '化妆水'),
 '保湿喷雾': ('护肤品', '化妆水'),
 '舒缓喷雾': ('护肤品', '化妆水'),
 '面霜': ('护肤品', '面霜类'),
 '日霜': ('护肤品', '面霜类'),
 '晚霜': ('护肤品', '面霜类'),
 '柔肤霜': ('护肤品', '面霜类'),
 '滋润霜': ('护肤品', '面霜类'),
 '保湿霜': ('护肤品', '面霜类'),
 '凝霜': ('护肤品', '面霜类'),
 '日间霜': ('护肤品', '面霜类'),
 '晚间霜': ('护肤品', '面霜类'),
 '乳霜'

In [18]:
def get_type(title_split):
    """Return the (main type, sub type) pair for a tokenised product title.

    The first token in ``title_split`` that is a key of
    ``category_config_map`` decides the category. When no token is a key,
    the pair stored under '其他' is returned.
    """
    first_hit = next(
        (token for token in title_split if token in category_config_map),
        '其他',
    )
    return category_config_map[first_hit]
# Quick look-up to check the mapping for one keyword
category_config_map['高光']


('化妆品', '修容类')

In [19]:
# Add the main category and sub category of every product.
# get_type yields one (main type, sub type) tuple per tokenised title; the
# .str accessor indexes into each tuple element-wise. The tuples are kept in
# the local Series only, so no temporary column has to be added and dropped.
types = data['item_name_cut'].apply(get_type)
data['main_type'] = types.str[0]
data['sub_type'] = types.str[1]

In [20]:
# Spot-check 20 random rows; no random_state is set, so the rows differ between runs
data.sample(20)

Unnamed: 0,update_time,id,title,price,sale_count,comment_count,brand,item_name_cut,main_type,sub_type
15522,2016-11-12,A526115151470,L'OREAL欧莱雅男士护肤激能三件套 洁面+水凝露+精华露,249.0,9606.0,2313.0,欧莱雅,"[L, ', OREAL, 欧莱雅, 男士, 护肤, 激能, 三件套, , 洁面, +, ...",护肤品,清洁类
23448,2016-11-06,A520655216584,兰蔻 唇膏口红迷恋丝缎唇膏3.4g 保湿持久显色滋养双唇,270.0,8327.0,940.0,兰蔻,"[兰蔻, , , 唇膏, 口红, 迷恋, 丝缎, 唇膏, 3.4, g, , 保湿, ...",化妆品,口红类
23734,2016-11-14,A540682405638,【娇兰】幻彩流星彩妆刷定妆刷散粉刷 幻彩流星粉球必备搭档,310.0,24.0,0.0,娇兰,"[【, 娇兰, 】, 幻彩, 流星, 彩妆, 刷, 定妆, 刷散, 粉刷, , 幻彩, 流...",其他,其他
20527,2016-11-13,A12727688676,美宝莲眼唇卸妆液 脸部眼部及唇部卸妆油卸妆水温和清爽深层清洁,60.0,493497.0,22544.0,美宝莲,"[美宝莲, 眼唇, 卸妆液, , 脸部, 眼部, 及, 唇部, 卸妆油, 卸妆水, 温和,...",护肤品,清洁类
672,2016-11-09,A539756246009,CHANDO/自然堂自然堂雪域精粹纯粹滋润乳液礼装组合 补水保湿滋润,158.0,231.0,76.0,自然堂,"[CHANDO, /, 自然, 堂, 自然, 堂, 雪域, 精粹, 纯粹, 滋润, 乳液, ...",护肤品,乳液类
1063,2016-11-06,A540001187127,CHANDO/自然堂凝润滋养护唇膏两只装 持久滋润 润泽肌肤 保湿唇膏,65.0,79.0,22.0,自然堂,"[CHANDO, /, 自然, 堂凝润, 滋养, 护唇膏, 两只, 装, , 持久, 滋润...",其他,其他
12960,2016-11-08,A18413490530,Clinique倩碧净彻爽肤水200ml 男士护肤洁肤化妆水 温和去角质,190.0,1832.0,190.0,倩碧,"[Clinique, 倩碧净彻, 爽肤水, 200ml, , 男士, 护肤, 洁肤, 化妆...",护肤品,化妆水
15240,2016-11-13,A7901269404,L'OREAL欧莱雅可丝莹温和染发霜 染发剂 长效护发滋润,69.0,25083.0,704.0,欧莱雅,"[L, ', OREAL, 欧莱雅, 可丝莹, 温和, 染发, 霜, , 染发剂, , ...",其他,其他
7592,2016-11-14,A38637185952,【新享价】雅诗兰黛红石榴水红石榴能量水200ml 滋润型补水爽肤水,420.0,14121.0,1270.0,雅诗兰黛,"[【, 新, 享价, 】, 雅诗兰黛, 红, 石榴, 水红, 石榴, 能量, 水, 200m...",护肤品,化妆水
25713,2016-11-10,A520977560720,Herborist/佰草集男仕清爽控油液体皂150g男士平衡控油清洁洁面,120.0,1848.0,275.0,佰草集,"[Herborist, /, 佰草集, 男仕, 清爽, 控油, 液体, 皂, 150g, 男...",护肤品,清洁类


In [21]:
# Add the man_only flag: '是' when the title mentions '男士' and does not mention '女士', else '否'
data['man_only'] = [
    '否' if ('男士' not in title or '女士' in title) else '是'
    for title in data['title']
]
data.sample(5)

Unnamed: 0,update_time,id,title,price,sale_count,comment_count,brand,item_name_cut,main_type,sub_type,man_only
7111,2016-11-11,A520789046377,雅漾 清透美白乳50ml 补水滋养 深层保湿 提亮肤色 清爽轻盈,280.0,1365.0,230.0,雅漾,"[雅漾, , 清透, 美白乳, 50ml, , 补水, 滋养, , 深层, 保湿, ...",护肤品,乳液类,否
23473,2016-11-06,A527342242920,【11-11预售】兰蔻菁纯臻颜玫瑰愈颜霜 润养修护受损肌肤,2680.0,289.0,36.0,兰蔻,"[【, 11, -, 11, 预售, 】, 兰蔻菁, 纯臻颜, 玫瑰, 愈颜霜, , 润养...",其他,其他,否
17676,2016-11-09,A36294342552,德国进口 2支包邮*妮维雅男女润唇膏唇膜保湿滋润淡化唇纹SPF15,34.99,26062.0,2523.0,妮维雅,"[德国, 进口, , 2, 支包, 邮, *, 妮维雅, 男女, 润唇膏, 唇膜, 保湿,...",其他,其他,否
17628,2016-11-09,A17309357968,德国妮维雅男士水活多效润肤露乳液补水滋润保湿护肤提亮,48.99,33367.0,980.0,妮维雅,"[德国, 妮维雅, 男士, 水活, 多效, 润肤露, 乳液, 补水, 滋润, 保湿, 护肤,...",护肤品,乳液类,是
5622,2016-11-05,A43278549432,innisfree/悦诗风吟山茶花菁华修护润发乳200ml 无硅油,80.0,1094.0,87.0,悦诗风吟,"[innisfree, /, 悦诗, 风吟, 山茶花, 菁华, 修护, 润, 发乳, 200...",其他,其他,否


In [22]:
# Derive the final analysis columns in one chain:
#   sale_money - revenue per row (price * sale_count)
#   day        - day of month taken from update_time
# then drop the token lists and renumber the rows from 0.
data = (
    data
    .assign(
        sale_money=data['price'] * data['sale_count'],
        day=data['update_time'].dt.day,
    )
    .drop(columns='item_name_cut')
    .reset_index(drop=True)
)
data.sample(10)

Unnamed: 0,update_time,id,title,price,sale_count,comment_count,brand,main_type,sub_type,man_only,sale_money,day
21484,2016-11-06,A520947187116,【11-11预售】兰蔻美肤修护乳液100ml+美肤美容液200ml水润保湿,1285.0,2992.0,283.0,兰蔻,护肤品,乳液类,否,3844720.0,6
24060,2016-11-09,A523780360913,Herborist/佰草集全天候焕肤保湿面膜120ml,180.0,298.0,39.0,佰草集,护肤品,面膜类,否,53640.0,9
22149,2016-11-10,A540685354480,【品牌团】娇兰御廷兰花卓能焕活洁面乳 温和清洁 净化舒缓肌肤,880.0,0.0,0.0,娇兰,护肤品,清洁类,否,0.0,10
16039,2016-11-07,A41337324901,德国妮维雅男士活力劲爽肤水补水保湿控油收毛孔淡化细纹祛痘印,79.0,15272.0,1486.0,妮维雅,护肤品,化妆水,是,1206488.0,7
8123,2016-11-13,A2251610120,正品相宜本草四倍多萃润泽洁面膏深层清洁滋润补水保湿,29.0,225343.0,3888.0,相宜本草,护肤品,清洁类,否,6534947.0,13
6072,2016-11-11,A525788098564,【11-11单品】雅诗兰黛红石榴鲜活亮采面霜 提亮肤色排浊润养,590.0,94.0,2.0,雅诗兰黛,护肤品,面霜类,否,55460.0,11
14816,2016-11-06,A41855390825,L'OREAL欧莱雅清润葡萄籽晚安膜力晶露 补水保湿弹润果冻质地晚霜,160.0,2575.0,233.0,欧莱雅,护肤品,面霜类,否,412000.0,6
476,2016-11-10,A24599364463,自然堂 活泉加倍补水乳霜60g 补水保湿改善肌肤干燥专柜正品包邮,110.0,5618.0,535.0,自然堂,护肤品,面霜类,否,617980.0,10
9317,2016-11-05,A536857288549,正品相宜本草黑茶男士醒肤洁面膏补水保湿护肤清爽控油,39.0,968.0,516.0,相宜本草,其他,其他,是,37752.0,5
6407,2016-11-09,A40174935000,雅诗兰黛化妆刷 腮红刷15号 大号 单支装,400.0,21.0,0.0,雅诗兰黛,化妆品,修容类,否,8400.0,9


In [23]:
# Persist the cleaned dataset as CSV in the working directory.
# NOTE(review): to_csv also writes the row index as an unnamed first column by default;
# the index is only a 0..n-1 range after the reset above, so index=False may be preferable
# -- confirm how downstream readers load this file before changing it.
data.to_csv('./clean_data.csv')