# 통합 식품영양성분DB 정리
### - [클리닝](#1.-클리닝)
### - [타입 변경(object -> float)](#2.-타입-변경)
### - [데이터 단위 통일(영양소 g으로 통일)](#3.-영양소-별-데이터-단위-통일)
### - [각 식품의 영양소 최대 값 행 추가](#4.-)

In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import re

In [2]:
food_nutrients = pd.read_excel('통합 식품영양성분DB_20211106.xlsx', skiprows=[0,1,2], engine='openpyxl')
food_nutrients.head()

Unnamed: 0,NO,SAMPLE_ID,식품코드,DB군,상용제품,식품명,연도,지역 / 제조사,채취시기,식품대분류,...,냉산가용성물질(㎎),총 불포화지방산(g),식염상당량(g),회분(g),폐기율(%),가식부(%),산가용성물질(%),카페인(㎎),성분표출처,발행기관
0,1,D000006-94-AVG,D000006,음식,품목대표,꿩불고기,2019,충주,평균,구이류,...,-,-,-,5.8,-,-,-,-,식약처('16) 제4권,식품의약품안전처
1,2,D000007-ZZ-AVG,D000007,음식,품목대표,닭갈비,2019,전국(대표),평균,구이류,...,-,-,-,7.0,-,-,-,-,식약처('16) 제4권,식품의약품안전처
2,3,D000008-66-AVG,D000008,음식,품목대표,닭갈비,2019,춘천,평균,구이류,...,-,-,-,4.5,-,-,-,-,식약처('16) 제4권,식품의약품안전처
3,4,D000009-ZZ-AVG,D000009,음식,품목대표,닭꼬치,2019,전국(대표),평균,구이류,...,-,-,-,1.2176954799497,-,-,-,-,식약처('12) 제1권,식품의약품안전처
4,5,D000010-ZZ-AVG,D000010,음식,품목대표,더덕구이,2019,전국(대표),평균,구이류,...,-,-,-,2.5,-,-,-,-,식약처('17) 제5권,식품의약품안전처


In [3]:
pd.options.display.max_columns = 241
pd.set_option('display.max.colwidth', 50)

food_nutrients.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 58597 entries, 0 to 58596
Columns: 241 entries, NO to 발행기관
dtypes: float64(1), int64(2), object(238)
memory usage: 107.7+ MB


## 1. 클리닝 

#### 필요없는 colum 제거 및 float로 변환하기 위해 데이터 정제

In [4]:
food_nutrients = food_nutrients.drop(['SAMPLE_ID', '식품코드', '연도', '지역 / 제조사',\
                                      '채취시기', '에너지(kj)', '폐기율(%)', '성분표출처', '발행기관'], axis = 1)

In [5]:
food_nutrients.head()

Unnamed: 0,NO,DB군,상용제품,식품명,식품대분류,식품상세분류,1회제공량,내용량_단위,총내용량(g),총내용량(mL),에너지(㎉),수분(g),수분(%),단백질(g),지방(g),지질-가식부 100g당,탄수화물(g),총당류(g),자당(g),포도당(g),과당(g),유당(g),맥아당(g),갈락토오스(g),당알콜(g),에리스리톨(g),총 식이섬유(g),총 식이섬유(mg),총 식이섬유(%),수용성 식이섬유(g),불용성 식이섬유(g),셀룰로오스(%),리그닌(%),칼슘(㎎),철(㎎),철(㎍),마그네슘(㎎),인(㎎),칼륨(g),칼륨(㎎),나트륨(㎎),아연(㎎),구리(㎎),구리(㎍),망간(㎎),망간(㎍),셀레늄(㎍),몰리브덴(㎍),요오드(㎍),염소(㎎),비타민 A(㎍),비타민 A(㎍ RE),레티놀(㎍),베타카로틴(㎍),레티놀A효능,비타민 D(D2+D3)(㎍),비타민 D2(㎍),비타민 D3(㎍),비타민 D1(㎍),비타민 E(㎎),비타민 E(㎎ α-TE),알파 토코페롤(㎎),베타 토코페롤(㎎),감마 토코페롤(㎎),델타 토코페롤(㎎),알파 토코트리에놀(㎎),베타 토코트리에놀(㎎),감마 토코트리에놀(㎎),델타 토코트리에놀(㎎),토코페롤(㎎),토코트리에놀(㎎),비타민 K(㎎),비타민 K(㎍),비타민 K1(㎍),비타민 K2(㎍),비타민 B1(㎎),비타민 B1(㎍),비타민 B2(㎎),비타민 B2(㎍),나이아신(㎎),나이아신(㎎ NE),나이아신(NE)(㎎),나이아신(NE)(㎎ NE),니코틴산 (㎎),니코틴아마이드(㎎),판토텐산(㎎),판토텐산(㎍),비타민 B6(㎎),비타민 B6(㎍),피리독신(㎎),비오틴(㎍),엽산(DFE)(㎍),엽산 - 천연 엽산(㎍),엽산 - 합성 엽산(㎍),비타민 B12(㎎),비타민 B12(㎍),비타민 C(g),비타민 C(㎎),콜린(g),콜린(㎎),총 아미노산(g),총 아미노산(㎎),필수 아미노산(㎎),이소류신(㎎),류신(㎎),라이신(㎎),메티오닌(㎎),페닐알라닌(㎎),트레오닌(㎎),트립토판(㎎),발린(㎎),히스티딘(㎎),아르기닌(㎎),비필수 아미노산(㎎),티로신(㎎),시스테인(㎎),알라닌(㎎),아스파르트산(㎎),글루탐산(㎎),글리신(㎎),프롤린(㎎),세린(㎎),타우린(㎎),글리신 베타인 (㎎),호마린(㎎),트리고넬린(㎎),리보핵산(㎎),데옥시리보핵산(㎎),콜레스테롤(g),콜레스테롤(㎎),총 지방산(g),총 필수 지방산(g),총 포화 지방산(g),총 포화 지방산(%),부티르산(4:0)(g),부티르산(4:0)(㎎),카프로산(6:0)(g),카프로산(6:0)(㎎),카프릴산(8:0)(g),카프릴산(8:0)(㎎),카프르산(10:0)(g),카프르산(10:0)(㎎),라우르산(12:0)(g),라우르산(12:0)(㎎),라우르산(12:0)(%),트라이데칸산(13:0)(㎎),미리스트산(14:0)(g),미리스트산(14:0)(㎎),미리스트산(14:0)(%),펜타데칸산(15:0)(㎎),팔미트산(16:0)(g),팔미트산(16:0)(㎎),팔미트산(16:0)(%),헵타데칸산(17:0)(㎎),스테아르산(18:0)(g),스테아르산(18:0)(㎎),스테아르산(18:0)(%),아라키드산(20:0)(g),아라키드산(20:0)(㎎),아라키드산(20:0)(%),헨에이코산산(21:0)(㎎),베헨산(22:0)(㎎),트리코산산(23:0)(㎎),리그노세르산(24:0)(㎎),총 단일 불포화지방산(g),총 단일 불포화지방산(%),미리스톨레산(14:1)(g),미리스톨레산(14:1)(㎎),미리스톨레산(14:1)(%),팔미톨레산(16:1)(g),팔미톨레산(16:1)(㎎),팔미톨레산(16:1)(%),헵타데센산(17:1)(㎎),올레산(18:1(n-9))(g),올레산(18:1(n-9))(㎎),올레산(18:1(n-9))(%),박센산(18:1(n-7))(g),박센산(18:1(n-7))(㎎),가돌레산(20:1)(g),가돌레산(20:1)(㎎),가돌레산(20:1)(%),에루크산(22:1)(㎎),에루크산(22:1)(%),네르본산(24:1)(㎎),총 다중 불포화지방산(g),총 다중 불포화지방산(%),리놀레산(18:2(n-6)c)(g),리놀레산(18:2(n-6)c)(㎎),리놀레산(18:2(n-6)c)(%),알파 리놀렌산(18:3(n-3))(g),알파 리놀렌산(18:3(n-3))(㎎),리놀렌산(18:3(n-3)(%),감마 리놀렌산(18:3(n-6))(g),감마 리놀렌산(18:3(n-6))(㎎),스테아리돈산(18:4)(%),에이코사디에노산(20:2(n-6))(g),에이코사디에노산(20:2(n-6))(㎎),에이코사트리에노산(20:3(n-3))(㎎),에이코사트리에노산(20:3(n-6))(g),에이코사트리에노산(20:3(n-6))(㎎),아라키돈산(20:4(n-6))(g),아라키돈산(20:4(n-6))(㎎),아라키돈산(20:4(n-6))(%),에이코사테트라에노산(20:4(n-3))(㎎),에이코사펜타에노산(20:5(n-3))(g),에이코사펜타에노산(20:5(n-3))(㎎),에이코사펜타에노산(20:5(n-3))(%),도코사디에노산(22:2)(㎎),도코사펜타에노산(22:5(n-3))(g),도코사펜타에노산(22:5(n-3))(㎎),도코사펜타에노산(22:5(n-3))(%),도코사헥사에노산(22:6(n-3))(g),도코사헥사에노산(22:6(n-3))(㎎),도코사헥사에노산(22:6(n-3))(%),EPA와 DHA의 합(㎎),오메가 3 지방산(g),오메가 6 지방산(g),트랜스 지방산(g),트랜스 올레산(18:1(n-9)t)(g),트랜스 올레산(18:1(n-9)t)(㎎),트랜스 리놀레산 (18:2t)(g),트랜스 리놀레산 (18:2t)(㎎),트랜스 리놀렌산(18:3t)(g),트랜스 리놀렌산(18:3t)(㎎),트랜스 리놀렌산(18:3t)(%),냉산가용성물질(㎎),총 불포화지방산(g),식염상당량(g),회분(g),가식부(%),산가용성물질(%),카페인(㎎)
0,1,음식,품목대표,꿩불고기,구이류,육류구이,500.0,g,-,-,368.8,412.6,-,33.5,8.5,-,39.7,16.9,7.2,2.8,2.8,0.7,3.5,-,-,-,9.8,-,-,-,-,-,-,105.61,-,4.0,85.39,458.05,-,1243.12,1264.31,3.99,0.32,-,0.68,-,47.55,-,-,-,-,-,0.0,1424.58,-,-,-,-,-,-,-,-,-,-,-,-,-,-,-,8.73,0.06,-,-,-,-,0.0,-,0.33,-,3.61,-,-,-,-,-,-,-,-,-,-,-,63.13,-,-,-,0.0,-,2.99,-,-,-,-,-,1284.37582123574,2328.59892766839,2484.75047814224,645.190070073169,1274.92730261488,1410.84127771718,-,1367.68831341948,848.539312406619,2205.5847774439,-,919.805669181432,276.498720836072,1642.38119022329,2781.77304833044,4784.60634708081,1419.92479570739,1092.29548260871,1264.95795056827,-,-,-,-,-,-,-,106.18,-,-,1.9,-,0,-,0,-,0,-,0.0,-,0.0071148347196189,-,-,-,0.0317835536096363,-,-,-,1.28384114493856,-,-,-,0.527395267901326,-,-,0.0290123491481805,-,-,-,-,-,-,-,-,0.0,-,-,0.0813516573054785,-,-,-,2.30772104748742,-,-,0.113462530850897,-,0.0279762322988018,-,-,-,-,-,-,-,3.23601791813763,-,-,0.656722581376586,-,-,0.018708284652282,-,-,0.0066488700771641,-,-,0.0,-,0.142840481460645,-,-,-,0.0,-,-,-,0.0,-,-,0.0234269823295255,-,-,-,-,-,0.1,0.018116327971628,-,0.0534160839712029,-,0.0,-,-,-,-,-,5.8,-,-,-
1,2,음식,품목대표,닭갈비,구이류,육류구이,400.0,g,-,-,595.61,276.4,-,45.9,25.8,-,44.9,21.2,3.6,5.9,4.8,0.0,6.9,-,-,-,11.6,-,-,-,-,-,-,98.64,-,3.38,104.42,505.25,-,1200.24,1535.83,3.55,0.34,-,0.97,-,57.56,-,-,-,-,-,38.61,2133.37,-,-,-,-,-,-,-,-,-,-,-,-,-,-,-,6.82,0.04,-,-,-,-,0.24,-,0.37,-,1.23,-,-,-,-,-,-,-,-,-,-,-,108.13,-,-,-,1.12,-,5.54,-,-,-,-,-,1796.24151075719,3245.40464371184,3593.31213240036,878.040312336548,1830.14127194101,2019.9394227759,-,1966.31473590112,1198.58224877347,2851.72274483,-,1310.51326329693,307.730115350377,2465.1998212526,4361.76110854525,7778.83843669619,2230.07868308554,1865.82488189018,1833.38617767634,-,-,-,-,-,-,-,193.4,-,-,6.0,-,0,-,0,-,0,-,0.0016983071768326,-,0.0317943799610758,-,-,-,0.179374770348105,-,-,-,4.48483692256034,-,-,-,1.27094632800629,-,-,0.031974799247989,-,-,-,-,-,-,-,-,0.0505025093215654,-,-,1.29026338814361,-,-,-,8.11557700814867,-,-,0.464755835992049,-,0.0821514653597206,-,-,-,-,-,-,-,4.85129439150118,-,-,0.443452616478064,-,-,0.0207316688429758,-,-,0.0266817256973322,-,-,0.0403311208335205,-,0.127788794975451,-,-,-,0.0061434614772668,-,-,-,0.0157059786402594,-,-,0.009782043963298,-,-,-,-,-,0.2,0.0750485023295658,-,0.0646068457814869,-,0.0132108495883938,-,-,-,-,-,7.0,-,-,-
2,3,음식,품목대표,닭갈비,구이류,육류구이,300.0,g,-,-,558.47,195.4,-,45.5,31.6,-,23.1,8.5,0.6,3.2,3.2,0.0,1.5,-,-,-,6.6,-,-,-,-,-,-,63.06,-,2.5,77.07,421.66,-,818.11,1016.94,3.59,0.24,-,0.41,-,51.18,-,-,-,-,-,75.14,493.75,-,-,-,-,-,-,-,-,-,-,-,-,-,-,-,3.58,0.23,-,-,-,-,0.22,-,0.38,-,2.96,-,-,-,-,-,-,-,-,-,-,-,57.96,-,-,-,0.0,-,0.0,-,-,-,-,-,1573.21753798369,3050.29862457744,3210.68973583949,970.590434447847,1783.35498660556,1873.14258889463,-,1707.20801010628,1133.53318735682,2818.65089446732,-,1287.47986619809,291.023739849734,2198.62200139702,3872.9985009794,6674.56898794857,2274.23989275482,1743.25535236687,1763.98161157487,-,-,-,-,-,-,-,217.67,-,-,11.3,-,0,-,0,-,0,-,0.0107353033878382,-,0.0657545977594388,-,-,-,0.349752418213963,-,-,-,8.66193859774305,-,-,-,2.13967909709909,-,-,0.035596334339806,-,-,-,-,-,-,-,-,0.10592332578478,-,-,2.22518721845149,-,-,-,13.8613266734469,-,-,0.767247543668996,-,0.141926417099115,-,-,-,-,-,-,-,5.43422559032569,-,-,0.390665541261449,-,-,0.0564227915888111,-,-,0.0497288641098893,-,-,0.0520810636551763,-,0.1626478800835,-,-,-,0.0108231002425958,-,-,-,0.0221575851175747,-,-,0.0160329856288409,-,-,-,-,-,0.3,0.140151166523609,-,0.0784323811375729,-,0.0319701885707348,-,-,-,-,-,4.5,-,-,-
3,4,음식,품목대표,닭꼬치,구이류,육류구이,70.0,g,-,-,176.722661137077,35.3079065997919,-,11.561723041353,8.56501389120873,-,13.3476609876966,3.15210668563089,0.106114460794218,0.816880663046302,1.63997930717926,0.0,0.589132254611108,-,-,-,2.07170833333333,-,-,-,-,-,-,17.6750468292727,-,7.63691788880754,0.0,122.798123571596,-,152.663030000484,286.911027516294,0.0,0.0,-,0.0,-,0.0,-,-,-,-,-,14.7534711264017,46.097313453717,-,-,-,-,-,-,-,-,-,-,-,-,-,-,-,0.0,0.0,-,-,-,-,0.226146222103857,-,0.18408413082574,-,1.71325274082621,-,-,-,-,-,-,-,-,-,-,-,0.0,-,-,-,0.0,-,0.0,-,-,-,-,-,0.0,0.0,0.0,0.0,0.0,0.0,-,0.0,0.0,0.0,-,-,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-,-,-,-,-,-,-,31.4437176472469,-,-,2.31532784916834,-,0,-,0,-,0,-,0.0,-,0.0,-,-,-,0.1,-,-,-,1.8,-,-,-,0.5,-,-,0.0,-,-,-,-,-,-,-,-,0.0,-,-,0.4,-,-,-,3.3,-,-,0.2,-,0.0,-,-,-,-,-,-,-,1.9,-,-,0.2,-,-,0.0,-,-,0.0,-,-,0.0,-,0.0,-,-,-,0.0,-,-,-,0.0,-,-,0.0,-,-,-,-,-,0.0438631942105014,0.0,-,0.0,-,0.0,-,-,-,-,-,1.2176954799497,-,-,-
4,5,음식,품목대표,더덕구이,구이류,채소류구이,100.0,g,-,-,184.0,58.1,-,3.1,5.2,-,31.1,11.6,2.2,2.7,1.5,0.0,5.1,-,-,-,6.8,-,-,-,-,-,-,46.42,-,1.43,38.21,88.17,-,262.44,743.37,0.59,0.13,-,0.42,-,0.0,-,-,-,-,-,0.0,481.44,-,-,-,-,-,-,-,-,-,-,-,-,-,-,-,3.89,1.47,-,-,-,-,0.23,-,0.08,-,0.18,-,-,-,-,-,-,-,-,-,-,-,16.77,-,-,-,0.0,-,1.34,-,-,-,-,-,69.84,126.53,90.72,16.36,82.78,70.97,-,87.91,44.56,457.03,-,33.86,9.73,91.19,203.15,620.8,83.58,117.2,83.49,-,-,-,-,-,-,-,0.12,-,-,0.8,-,0,-,0,-,0,-,0.0,-,0.0,-,-,-,0.0,-,-,-,0.5,-,-,-,0.2,-,-,0.0,-,-,-,-,-,-,-,-,0.0,-,-,0.0,-,-,-,1.3,-,-,0.1,-,0.0,-,-,-,-,-,-,-,2.3,-,-,0.4,-,-,0.0,-,-,0.0,-,-,0.0,-,0.0,-,-,-,0.0,-,-,-,0.0,-,-,0.0,-,-,-,-,-,0.0,0.0,-,0.0,-,0.0,-,-,-,-,-,2.5,-,-,-


In [6]:
food_nutrients_copy = food_nutrients.copy()
food_nutrients_copy.loc[: ,'단백질(g)':'카페인(㎎)'] = food_nutrients.loc[: ,'단백질(g)':'카페인(㎎)'].replace(['-', 'tr', 'Tr'], 0)

In [7]:
food_nutrients_copy.loc[: ,'단백질(g)':'카페인(㎎)'] = \
        food_nutrients_copy.loc[: ,'단백질(g)':'카페인(㎎)'].replace(re.compile(r'미만'), 0)
food_nutrients_copy.loc[: ,'단백질(g)':'카페인(㎎)'] = \
        food_nutrients_copy.loc[: ,'단백질(g)':'카페인(㎎)'].replace(re.compile(r'이하'), 0)
food_nutrients_copy.loc[: ,'단백질(g)':'카페인(㎎)'] = \
        food_nutrients_copy.loc[: ,'단백질(g)':'카페인(㎎)'].replace(re.compile(r'<'), 0)

food_nutrients_copy.head()

Unnamed: 0,NO,DB군,상용제품,식품명,식품대분류,식품상세분류,1회제공량,내용량_단위,총내용량(g),총내용량(mL),에너지(㎉),수분(g),수분(%),단백질(g),지방(g),지질-가식부 100g당,탄수화물(g),총당류(g),자당(g),포도당(g),과당(g),유당(g),맥아당(g),갈락토오스(g),당알콜(g),에리스리톨(g),총 식이섬유(g),총 식이섬유(mg),총 식이섬유(%),수용성 식이섬유(g),불용성 식이섬유(g),셀룰로오스(%),리그닌(%),칼슘(㎎),철(㎎),철(㎍),마그네슘(㎎),인(㎎),칼륨(g),칼륨(㎎),나트륨(㎎),아연(㎎),구리(㎎),구리(㎍),망간(㎎),망간(㎍),셀레늄(㎍),몰리브덴(㎍),요오드(㎍),염소(㎎),비타민 A(㎍),비타민 A(㎍ RE),레티놀(㎍),베타카로틴(㎍),레티놀A효능,비타민 D(D2+D3)(㎍),비타민 D2(㎍),비타민 D3(㎍),비타민 D1(㎍),비타민 E(㎎),비타민 E(㎎ α-TE),알파 토코페롤(㎎),베타 토코페롤(㎎),감마 토코페롤(㎎),델타 토코페롤(㎎),알파 토코트리에놀(㎎),베타 토코트리에놀(㎎),감마 토코트리에놀(㎎),델타 토코트리에놀(㎎),토코페롤(㎎),토코트리에놀(㎎),비타민 K(㎎),비타민 K(㎍),비타민 K1(㎍),비타민 K2(㎍),비타민 B1(㎎),비타민 B1(㎍),비타민 B2(㎎),비타민 B2(㎍),나이아신(㎎),나이아신(㎎ NE),나이아신(NE)(㎎),나이아신(NE)(㎎ NE),니코틴산 (㎎),니코틴아마이드(㎎),판토텐산(㎎),판토텐산(㎍),비타민 B6(㎎),비타민 B6(㎍),피리독신(㎎),비오틴(㎍),엽산(DFE)(㎍),엽산 - 천연 엽산(㎍),엽산 - 합성 엽산(㎍),비타민 B12(㎎),비타민 B12(㎍),비타민 C(g),비타민 C(㎎),콜린(g),콜린(㎎),총 아미노산(g),총 아미노산(㎎),필수 아미노산(㎎),이소류신(㎎),류신(㎎),라이신(㎎),메티오닌(㎎),페닐알라닌(㎎),트레오닌(㎎),트립토판(㎎),발린(㎎),히스티딘(㎎),아르기닌(㎎),비필수 아미노산(㎎),티로신(㎎),시스테인(㎎),알라닌(㎎),아스파르트산(㎎),글루탐산(㎎),글리신(㎎),프롤린(㎎),세린(㎎),타우린(㎎),글리신 베타인 (㎎),호마린(㎎),트리고넬린(㎎),리보핵산(㎎),데옥시리보핵산(㎎),콜레스테롤(g),콜레스테롤(㎎),총 지방산(g),총 필수 지방산(g),총 포화 지방산(g),총 포화 지방산(%),부티르산(4:0)(g),부티르산(4:0)(㎎),카프로산(6:0)(g),카프로산(6:0)(㎎),카프릴산(8:0)(g),카프릴산(8:0)(㎎),카프르산(10:0)(g),카프르산(10:0)(㎎),라우르산(12:0)(g),라우르산(12:0)(㎎),라우르산(12:0)(%),트라이데칸산(13:0)(㎎),미리스트산(14:0)(g),미리스트산(14:0)(㎎),미리스트산(14:0)(%),펜타데칸산(15:0)(㎎),팔미트산(16:0)(g),팔미트산(16:0)(㎎),팔미트산(16:0)(%),헵타데칸산(17:0)(㎎),스테아르산(18:0)(g),스테아르산(18:0)(㎎),스테아르산(18:0)(%),아라키드산(20:0)(g),아라키드산(20:0)(㎎),아라키드산(20:0)(%),헨에이코산산(21:0)(㎎),베헨산(22:0)(㎎),트리코산산(23:0)(㎎),리그노세르산(24:0)(㎎),총 단일 불포화지방산(g),총 단일 불포화지방산(%),미리스톨레산(14:1)(g),미리스톨레산(14:1)(㎎),미리스톨레산(14:1)(%),팔미톨레산(16:1)(g),팔미톨레산(16:1)(㎎),팔미톨레산(16:1)(%),헵타데센산(17:1)(㎎),올레산(18:1(n-9))(g),올레산(18:1(n-9))(㎎),올레산(18:1(n-9))(%),박센산(18:1(n-7))(g),박센산(18:1(n-7))(㎎),가돌레산(20:1)(g),가돌레산(20:1)(㎎),가돌레산(20:1)(%),에루크산(22:1)(㎎),에루크산(22:1)(%),네르본산(24:1)(㎎),총 다중 불포화지방산(g),총 다중 불포화지방산(%),리놀레산(18:2(n-6)c)(g),리놀레산(18:2(n-6)c)(㎎),리놀레산(18:2(n-6)c)(%),알파 리놀렌산(18:3(n-3))(g),알파 리놀렌산(18:3(n-3))(㎎),리놀렌산(18:3(n-3)(%),감마 리놀렌산(18:3(n-6))(g),감마 리놀렌산(18:3(n-6))(㎎),스테아리돈산(18:4)(%),에이코사디에노산(20:2(n-6))(g),에이코사디에노산(20:2(n-6))(㎎),에이코사트리에노산(20:3(n-3))(㎎),에이코사트리에노산(20:3(n-6))(g),에이코사트리에노산(20:3(n-6))(㎎),아라키돈산(20:4(n-6))(g),아라키돈산(20:4(n-6))(㎎),아라키돈산(20:4(n-6))(%),에이코사테트라에노산(20:4(n-3))(㎎),에이코사펜타에노산(20:5(n-3))(g),에이코사펜타에노산(20:5(n-3))(㎎),에이코사펜타에노산(20:5(n-3))(%),도코사디에노산(22:2)(㎎),도코사펜타에노산(22:5(n-3))(g),도코사펜타에노산(22:5(n-3))(㎎),도코사펜타에노산(22:5(n-3))(%),도코사헥사에노산(22:6(n-3))(g),도코사헥사에노산(22:6(n-3))(㎎),도코사헥사에노산(22:6(n-3))(%),EPA와 DHA의 합(㎎),오메가 3 지방산(g),오메가 6 지방산(g),트랜스 지방산(g),트랜스 올레산(18:1(n-9)t)(g),트랜스 올레산(18:1(n-9)t)(㎎),트랜스 리놀레산 (18:2t)(g),트랜스 리놀레산 (18:2t)(㎎),트랜스 리놀렌산(18:3t)(g),트랜스 리놀렌산(18:3t)(㎎),트랜스 리놀렌산(18:3t)(%),냉산가용성물질(㎎),총 불포화지방산(g),식염상당량(g),회분(g),가식부(%),산가용성물질(%),카페인(㎎)
0,1,음식,품목대표,꿩불고기,구이류,육류구이,500.0,g,-,-,368.8,412.6,-,33.5,8.5,0,39.7,16.9,7.2,2.8,2.8,0.7,3.5,0,0,0,9.8,0,0,0,0,0,0,105.61,0,4.0,85.39,458.05,0,1243.12,1264.31,3.99,0.32,0,0.68,0,47.55,0,0,0,0,0,0.0,1424.58,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,8.73,0.06,0,0,0,0,0.0,0,0.33,0,3.61,0,0,0,0,0,0,0,0,0,0,0,63.13,0,0,0,0.0,0,2.99,0,0,0,0,0,1284.37582123574,2328.59892766839,2484.75047814224,645.190070073169,1274.92730261488,1410.84127771718,0,1367.68831341948,848.539312406619,2205.5847774439,0,919.805669181432,276.498720836072,1642.38119022329,2781.77304833044,4784.60634708081,1419.92479570739,1092.29548260871,1264.95795056827,0,0,0,0,0,0,0,106.18,0,0,1.9,0,0,0,0,0,0,0,0.0,0,0.0071148347196189,0,0,0,0.0317835536096363,0,0,0,1.28384114493856,0,0,0,0.527395267901326,0,0,0.0290123491481805,0,0,0,0,0,0,0,0,0.0,0,0,0.0813516573054785,0,0,0,2.30772104748742,0,0,0.113462530850897,0,0.0279762322988018,0,0,0,0,0,0,0,3.23601791813763,0,0,0.656722581376586,0,0,0.018708284652282,0,0,0.0066488700771641,0,0,0.0,0,0.142840481460645,0,0,0,0.0,0,0,0,0.0,0,0,0.0234269823295255,0,0,0,0,0,0.1,0.018116327971628,0,0.0534160839712029,0,0.0,0,0,0,0,0,5.8,0,0,0
1,2,음식,품목대표,닭갈비,구이류,육류구이,400.0,g,-,-,595.61,276.4,-,45.9,25.8,0,44.9,21.2,3.6,5.9,4.8,0.0,6.9,0,0,0,11.6,0,0,0,0,0,0,98.64,0,3.38,104.42,505.25,0,1200.24,1535.83,3.55,0.34,0,0.97,0,57.56,0,0,0,0,0,38.61,2133.37,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,6.82,0.04,0,0,0,0,0.24,0,0.37,0,1.23,0,0,0,0,0,0,0,0,0,0,0,108.13,0,0,0,1.12,0,5.54,0,0,0,0,0,1796.24151075719,3245.40464371184,3593.31213240036,878.040312336548,1830.14127194101,2019.9394227759,0,1966.31473590112,1198.58224877347,2851.72274483,0,1310.51326329693,307.730115350377,2465.1998212526,4361.76110854525,7778.83843669619,2230.07868308554,1865.82488189018,1833.38617767634,0,0,0,0,0,0,0,193.4,0,0,6.0,0,0,0,0,0,0,0,0.0016983071768326,0,0.0317943799610758,0,0,0,0.179374770348105,0,0,0,4.48483692256034,0,0,0,1.27094632800629,0,0,0.031974799247989,0,0,0,0,0,0,0,0,0.0505025093215654,0,0,1.29026338814361,0,0,0,8.11557700814867,0,0,0.464755835992049,0,0.0821514653597206,0,0,0,0,0,0,0,4.85129439150118,0,0,0.443452616478064,0,0,0.0207316688429758,0,0,0.0266817256973322,0,0,0.0403311208335205,0,0.127788794975451,0,0,0,0.0061434614772668,0,0,0,0.0157059786402594,0,0,0.009782043963298,0,0,0,0,0,0.2,0.0750485023295658,0,0.0646068457814869,0,0.0132108495883938,0,0,0,0,0,7.0,0,0,0
2,3,음식,품목대표,닭갈비,구이류,육류구이,300.0,g,-,-,558.47,195.4,-,45.5,31.6,0,23.1,8.5,0.6,3.2,3.2,0.0,1.5,0,0,0,6.6,0,0,0,0,0,0,63.06,0,2.5,77.07,421.66,0,818.11,1016.94,3.59,0.24,0,0.41,0,51.18,0,0,0,0,0,75.14,493.75,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3.58,0.23,0,0,0,0,0.22,0,0.38,0,2.96,0,0,0,0,0,0,0,0,0,0,0,57.96,0,0,0,0.0,0,0.0,0,0,0,0,0,1573.21753798369,3050.29862457744,3210.68973583949,970.590434447847,1783.35498660556,1873.14258889463,0,1707.20801010628,1133.53318735682,2818.65089446732,0,1287.47986619809,291.023739849734,2198.62200139702,3872.9985009794,6674.56898794857,2274.23989275482,1743.25535236687,1763.98161157487,0,0,0,0,0,0,0,217.67,0,0,11.3,0,0,0,0,0,0,0,0.0107353033878382,0,0.0657545977594388,0,0,0,0.349752418213963,0,0,0,8.66193859774305,0,0,0,2.13967909709909,0,0,0.035596334339806,0,0,0,0,0,0,0,0,0.10592332578478,0,0,2.22518721845149,0,0,0,13.8613266734469,0,0,0.767247543668996,0,0.141926417099115,0,0,0,0,0,0,0,5.43422559032569,0,0,0.390665541261449,0,0,0.0564227915888111,0,0,0.0497288641098893,0,0,0.0520810636551763,0,0.1626478800835,0,0,0,0.0108231002425958,0,0,0,0.0221575851175747,0,0,0.0160329856288409,0,0,0,0,0,0.3,0.140151166523609,0,0.0784323811375729,0,0.0319701885707348,0,0,0,0,0,4.5,0,0,0
3,4,음식,품목대표,닭꼬치,구이류,육류구이,70.0,g,-,-,176.722661137077,35.3079065997919,-,11.561723041353,8.56501389120873,0,13.3476609876966,3.15210668563089,0.106114460794218,0.816880663046302,1.63997930717926,0.0,0.589132254611108,0,0,0,2.07170833333333,0,0,0,0,0,0,17.6750468292727,0,7.63691788880754,0.0,122.798123571596,0,152.663030000484,286.911027516294,0.0,0.0,0,0.0,0,0.0,0,0,0,0,0,14.7534711264017,46.097313453717,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0,0,0,0,0.226146222103857,0,0.18408413082574,0,1.71325274082621,0,0,0,0,0,0,0,0,0,0,0,0.0,0,0,0,0.0,0,0.0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0,0,31.4437176472469,0,0,2.31532784916834,0,0,0,0,0,0,0,0.0,0,0.0,0,0,0,0.1,0,0,0,1.8,0,0,0,0.5,0,0,0.0,0,0,0,0,0,0,0,0,0.0,0,0,0.4,0,0,0,3.3,0,0,0.2,0,0.0,0,0,0,0,0,0,0,1.9,0,0,0.2,0,0,0.0,0,0,0.0,0,0,0.0,0,0.0,0,0,0,0.0,0,0,0,0.0,0,0,0.0,0,0,0,0,0,0.0438631942105014,0.0,0,0.0,0,0.0,0,0,0,0,0,1.2176954799497,0,0,0
4,5,음식,품목대표,더덕구이,구이류,채소류구이,100.0,g,-,-,184.0,58.1,-,3.1,5.2,0,31.1,11.6,2.2,2.7,1.5,0.0,5.1,0,0,0,6.8,0,0,0,0,0,0,46.42,0,1.43,38.21,88.17,0,262.44,743.37,0.59,0.13,0,0.42,0,0.0,0,0,0,0,0,0.0,481.44,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3.89,1.47,0,0,0,0,0.23,0,0.08,0,0.18,0,0,0,0,0,0,0,0,0,0,0,16.77,0,0,0,0.0,0,1.34,0,0,0,0,0,69.84,126.53,90.72,16.36,82.78,70.97,0,87.91,44.56,457.03,0,33.86,9.73,91.19,203.15,620.8,83.58,117.2,83.49,0,0,0,0,0,0,0,0.12,0,0,0.8,0,0,0,0,0,0,0,0.0,0,0.0,0,0,0,0.0,0,0,0,0.5,0,0,0,0.2,0,0,0.0,0,0,0,0,0,0,0,0,0.0,0,0,0.0,0,0,0,1.3,0,0,0.1,0,0.0,0,0,0,0,0,0,0,2.3,0,0,0.4,0,0,0.0,0,0,0.0,0,0,0.0,0,0.0,0,0,0,0.0,0,0,0,0.0,0,0,0.0,0,0,0,0,0,0.0,0.0,0,0.0,0,0.0,0,0,0,0,0,2.5,0,0,0


#### 중복된 데이터 제거

In [8]:
food_nutrients_copy = food_nutrients_copy.drop_duplicates(['식품명'])

food_nutrients_copy.head()

Unnamed: 0,NO,DB군,상용제품,식품명,식품대분류,식품상세분류,1회제공량,내용량_단위,총내용량(g),총내용량(mL),에너지(㎉),수분(g),수분(%),단백질(g),지방(g),지질-가식부 100g당,탄수화물(g),총당류(g),자당(g),포도당(g),과당(g),유당(g),맥아당(g),갈락토오스(g),당알콜(g),에리스리톨(g),총 식이섬유(g),총 식이섬유(mg),총 식이섬유(%),수용성 식이섬유(g),불용성 식이섬유(g),셀룰로오스(%),리그닌(%),칼슘(㎎),철(㎎),철(㎍),마그네슘(㎎),인(㎎),칼륨(g),칼륨(㎎),나트륨(㎎),아연(㎎),구리(㎎),구리(㎍),망간(㎎),망간(㎍),셀레늄(㎍),몰리브덴(㎍),요오드(㎍),염소(㎎),비타민 A(㎍),비타민 A(㎍ RE),레티놀(㎍),베타카로틴(㎍),레티놀A효능,비타민 D(D2+D3)(㎍),비타민 D2(㎍),비타민 D3(㎍),비타민 D1(㎍),비타민 E(㎎),비타민 E(㎎ α-TE),알파 토코페롤(㎎),베타 토코페롤(㎎),감마 토코페롤(㎎),델타 토코페롤(㎎),알파 토코트리에놀(㎎),베타 토코트리에놀(㎎),감마 토코트리에놀(㎎),델타 토코트리에놀(㎎),토코페롤(㎎),토코트리에놀(㎎),비타민 K(㎎),비타민 K(㎍),비타민 K1(㎍),비타민 K2(㎍),비타민 B1(㎎),비타민 B1(㎍),비타민 B2(㎎),비타민 B2(㎍),나이아신(㎎),나이아신(㎎ NE),나이아신(NE)(㎎),나이아신(NE)(㎎ NE),니코틴산 (㎎),니코틴아마이드(㎎),판토텐산(㎎),판토텐산(㎍),비타민 B6(㎎),비타민 B6(㎍),피리독신(㎎),비오틴(㎍),엽산(DFE)(㎍),엽산 - 천연 엽산(㎍),엽산 - 합성 엽산(㎍),비타민 B12(㎎),비타민 B12(㎍),비타민 C(g),비타민 C(㎎),콜린(g),콜린(㎎),총 아미노산(g),총 아미노산(㎎),필수 아미노산(㎎),이소류신(㎎),류신(㎎),라이신(㎎),메티오닌(㎎),페닐알라닌(㎎),트레오닌(㎎),트립토판(㎎),발린(㎎),히스티딘(㎎),아르기닌(㎎),비필수 아미노산(㎎),티로신(㎎),시스테인(㎎),알라닌(㎎),아스파르트산(㎎),글루탐산(㎎),글리신(㎎),프롤린(㎎),세린(㎎),타우린(㎎),글리신 베타인 (㎎),호마린(㎎),트리고넬린(㎎),리보핵산(㎎),데옥시리보핵산(㎎),콜레스테롤(g),콜레스테롤(㎎),총 지방산(g),총 필수 지방산(g),총 포화 지방산(g),총 포화 지방산(%),부티르산(4:0)(g),부티르산(4:0)(㎎),카프로산(6:0)(g),카프로산(6:0)(㎎),카프릴산(8:0)(g),카프릴산(8:0)(㎎),카프르산(10:0)(g),카프르산(10:0)(㎎),라우르산(12:0)(g),라우르산(12:0)(㎎),라우르산(12:0)(%),트라이데칸산(13:0)(㎎),미리스트산(14:0)(g),미리스트산(14:0)(㎎),미리스트산(14:0)(%),펜타데칸산(15:0)(㎎),팔미트산(16:0)(g),팔미트산(16:0)(㎎),팔미트산(16:0)(%),헵타데칸산(17:0)(㎎),스테아르산(18:0)(g),스테아르산(18:0)(㎎),스테아르산(18:0)(%),아라키드산(20:0)(g),아라키드산(20:0)(㎎),아라키드산(20:0)(%),헨에이코산산(21:0)(㎎),베헨산(22:0)(㎎),트리코산산(23:0)(㎎),리그노세르산(24:0)(㎎),총 단일 불포화지방산(g),총 단일 불포화지방산(%),미리스톨레산(14:1)(g),미리스톨레산(14:1)(㎎),미리스톨레산(14:1)(%),팔미톨레산(16:1)(g),팔미톨레산(16:1)(㎎),팔미톨레산(16:1)(%),헵타데센산(17:1)(㎎),올레산(18:1(n-9))(g),올레산(18:1(n-9))(㎎),올레산(18:1(n-9))(%),박센산(18:1(n-7))(g),박센산(18:1(n-7))(㎎),가돌레산(20:1)(g),가돌레산(20:1)(㎎),가돌레산(20:1)(%),에루크산(22:1)(㎎),에루크산(22:1)(%),네르본산(24:1)(㎎),총 다중 불포화지방산(g),총 다중 불포화지방산(%),리놀레산(18:2(n-6)c)(g),리놀레산(18:2(n-6)c)(㎎),리놀레산(18:2(n-6)c)(%),알파 리놀렌산(18:3(n-3))(g),알파 리놀렌산(18:3(n-3))(㎎),리놀렌산(18:3(n-3)(%),감마 리놀렌산(18:3(n-6))(g),감마 리놀렌산(18:3(n-6))(㎎),스테아리돈산(18:4)(%),에이코사디에노산(20:2(n-6))(g),에이코사디에노산(20:2(n-6))(㎎),에이코사트리에노산(20:3(n-3))(㎎),에이코사트리에노산(20:3(n-6))(g),에이코사트리에노산(20:3(n-6))(㎎),아라키돈산(20:4(n-6))(g),아라키돈산(20:4(n-6))(㎎),아라키돈산(20:4(n-6))(%),에이코사테트라에노산(20:4(n-3))(㎎),에이코사펜타에노산(20:5(n-3))(g),에이코사펜타에노산(20:5(n-3))(㎎),에이코사펜타에노산(20:5(n-3))(%),도코사디에노산(22:2)(㎎),도코사펜타에노산(22:5(n-3))(g),도코사펜타에노산(22:5(n-3))(㎎),도코사펜타에노산(22:5(n-3))(%),도코사헥사에노산(22:6(n-3))(g),도코사헥사에노산(22:6(n-3))(㎎),도코사헥사에노산(22:6(n-3))(%),EPA와 DHA의 합(㎎),오메가 3 지방산(g),오메가 6 지방산(g),트랜스 지방산(g),트랜스 올레산(18:1(n-9)t)(g),트랜스 올레산(18:1(n-9)t)(㎎),트랜스 리놀레산 (18:2t)(g),트랜스 리놀레산 (18:2t)(㎎),트랜스 리놀렌산(18:3t)(g),트랜스 리놀렌산(18:3t)(㎎),트랜스 리놀렌산(18:3t)(%),냉산가용성물질(㎎),총 불포화지방산(g),식염상당량(g),회분(g),가식부(%),산가용성물질(%),카페인(㎎)
0,1,음식,품목대표,꿩불고기,구이류,육류구이,500.0,g,-,-,368.8,412.6,-,33.5,8.5,0,39.7,16.9,7.2,2.8,2.8,0.7,3.5,0,0,0,9.8,0,0,0,0,0,0,105.61,0,4.0,85.39,458.05,0,1243.12,1264.31,3.99,0.32,0,0.68,0,47.55,0,0,0,0,0,0.0,1424.58,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,8.73,0.06,0,0,0,0,0.0,0,0.33,0,3.61,0,0,0,0,0,0,0,0,0,0,0,63.13,0,0,0,0.0,0,2.99,0,0,0,0,0,1284.37582123574,2328.59892766839,2484.75047814224,645.190070073169,1274.92730261488,1410.84127771718,0,1367.68831341948,848.539312406619,2205.5847774439,0,919.805669181432,276.498720836072,1642.38119022329,2781.77304833044,4784.60634708081,1419.92479570739,1092.29548260871,1264.95795056827,0,0,0,0,0,0,0,106.18,0,0,1.9,0,0,0,0,0,0,0,0.0,0,0.0071148347196189,0,0,0,0.0317835536096363,0,0,0,1.28384114493856,0,0,0,0.527395267901326,0,0,0.0290123491481805,0,0,0,0,0,0,0,0,0.0,0,0,0.0813516573054785,0,0,0,2.30772104748742,0,0,0.113462530850897,0,0.0279762322988018,0,0,0,0,0,0,0,3.23601791813763,0,0,0.656722581376586,0,0,0.018708284652282,0,0,0.0066488700771641,0,0,0.0,0,0.142840481460645,0,0,0,0.0,0,0,0,0.0,0,0,0.0234269823295255,0,0,0,0,0,0.1,0.018116327971628,0,0.0534160839712029,0,0.0,0,0,0,0,0,5.8,0,0,0
1,2,음식,품목대표,닭갈비,구이류,육류구이,400.0,g,-,-,595.61,276.4,-,45.9,25.8,0,44.9,21.2,3.6,5.9,4.8,0.0,6.9,0,0,0,11.6,0,0,0,0,0,0,98.64,0,3.38,104.42,505.25,0,1200.24,1535.83,3.55,0.34,0,0.97,0,57.56,0,0,0,0,0,38.61,2133.37,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,6.82,0.04,0,0,0,0,0.24,0,0.37,0,1.23,0,0,0,0,0,0,0,0,0,0,0,108.13,0,0,0,1.12,0,5.54,0,0,0,0,0,1796.24151075719,3245.40464371184,3593.31213240036,878.040312336548,1830.14127194101,2019.9394227759,0,1966.31473590112,1198.58224877347,2851.72274483,0,1310.51326329693,307.730115350377,2465.1998212526,4361.76110854525,7778.83843669619,2230.07868308554,1865.82488189018,1833.38617767634,0,0,0,0,0,0,0,193.4,0,0,6.0,0,0,0,0,0,0,0,0.0016983071768326,0,0.0317943799610758,0,0,0,0.179374770348105,0,0,0,4.48483692256034,0,0,0,1.27094632800629,0,0,0.031974799247989,0,0,0,0,0,0,0,0,0.0505025093215654,0,0,1.29026338814361,0,0,0,8.11557700814867,0,0,0.464755835992049,0,0.0821514653597206,0,0,0,0,0,0,0,4.85129439150118,0,0,0.443452616478064,0,0,0.0207316688429758,0,0,0.0266817256973322,0,0,0.0403311208335205,0,0.127788794975451,0,0,0,0.0061434614772668,0,0,0,0.0157059786402594,0,0,0.009782043963298,0,0,0,0,0,0.2,0.0750485023295658,0,0.0646068457814869,0,0.0132108495883938,0,0,0,0,0,7.0,0,0,0
3,4,음식,품목대표,닭꼬치,구이류,육류구이,70.0,g,-,-,176.722661137077,35.3079065997919,-,11.561723041353,8.56501389120873,0,13.3476609876966,3.15210668563089,0.106114460794218,0.816880663046302,1.63997930717926,0.0,0.589132254611108,0,0,0,2.07170833333333,0,0,0,0,0,0,17.6750468292727,0,7.63691788880754,0.0,122.798123571596,0,152.663030000484,286.911027516294,0.0,0.0,0,0.0,0,0.0,0,0,0,0,0,14.7534711264017,46.097313453717,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0.0,0.0,0,0,0,0,0.226146222103857,0,0.18408413082574,0,1.71325274082621,0,0,0,0,0,0,0,0,0,0,0,0.0,0,0,0,0.0,0,0.0,0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0,0,31.4437176472469,0,0,2.31532784916834,0,0,0,0,0,0,0,0.0,0,0.0,0,0,0,0.1,0,0,0,1.8,0,0,0,0.5,0,0,0.0,0,0,0,0,0,0,0,0,0.0,0,0,0.4,0,0,0,3.3,0,0,0.2,0,0.0,0,0,0,0,0,0,0,1.9,0,0,0.2,0,0,0.0,0,0,0.0,0,0,0.0,0,0.0,0,0,0,0.0,0,0,0,0.0,0,0,0.0,0,0,0,0,0,0.0438631942105014,0.0,0,0.0,0,0.0,0,0,0,0,0,1.2176954799497,0,0,0
4,5,음식,품목대표,더덕구이,구이류,채소류구이,100.0,g,-,-,184.0,58.1,-,3.1,5.2,0,31.1,11.6,2.2,2.7,1.5,0.0,5.1,0,0,0,6.8,0,0,0,0,0,0,46.42,0,1.43,38.21,88.17,0,262.44,743.37,0.59,0.13,0,0.42,0,0.0,0,0,0,0,0,0.0,481.44,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3.89,1.47,0,0,0,0,0.23,0,0.08,0,0.18,0,0,0,0,0,0,0,0,0,0,0,16.77,0,0,0,0.0,0,1.34,0,0,0,0,0,69.84,126.53,90.72,16.36,82.78,70.97,0,87.91,44.56,457.03,0,33.86,9.73,91.19,203.15,620.8,83.58,117.2,83.49,0,0,0,0,0,0,0,0.12,0,0,0.8,0,0,0,0,0,0,0,0.0,0,0.0,0,0,0,0.0,0,0,0,0.5,0,0,0,0.2,0,0,0.0,0,0,0,0,0,0,0,0,0.0,0,0,0.0,0,0,0,1.3,0,0,0.1,0,0.0,0,0,0,0,0,0,0,2.3,0,0,0.4,0,0,0.0,0,0,0.0,0,0,0.0,0,0.0,0,0,0,0.0,0,0,0,0.0,0,0,0.0,0,0,0,0,0,0.0,0.0,0,0.0,0,0.0,0,0,0,0,0,2.5,0,0,0
5,6,음식,품목대표,도미구이,구이류,어패류구이,250.0,g,-,-,397.0,163.3,-,61.1,16.5,0,2.1,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,5.9,0,0,0,0,0,0,158.8,0,0.97,120.37,690.91,0,1108.02,1582.17,1.45,0.06,0,0.06,0,281.39,0,0,0,0,0,65.65,2.3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3.76,0.0,0,0,0,0,0.1,0,0.27,0,6.35,0,0,0,0,0,0,0,0,0,0,0,37.98,0,0,0,7.45,0,0.84,0,0,0,0,0,2139.19,4277.88,4920.98,1725.16,2222.94,2583.86,0,2388.48,1351.76,3926.03,0,1958.54,481.77,3337.83,5706.62,8361.83,3076.27,2060.24,2382.06,0,0,0,0,0,0,0,211.24,0,0,3.8,0,0,0,0,0,0,0,0.0,0,0.0,0,0,0,0.4,0,0,0,2.5,0,0,0,0.8,0,0,0.1,0,0,0,0,0,0,0,0,0.0,0,0,0.6,0,0,0,2.9,0,0,0.4,0,0.2,0,0,0,0,0,0,0,1.9,0,0,0.3,0,0,0.0,0,0,0.0,0,0,0.1,0,0.2,0,0,0,0.6,0,0,0,0.3,0,0,1.6,0,0,0,0,0,0.1,0.0,0,0.0,0,0.1,0,0,0,0,0,7.0,0,0,0


In [9]:
food_nutrients_copy.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 49807 entries, 0 to 58596
Columns: 232 entries, NO to 카페인(㎎)
dtypes: float64(1), int64(9), object(222)
memory usage: 88.5+ MB


## 2. 타입 변경

In [10]:
food_nutrients_copy = food_nutrients_copy.astype({'1회제공량':'float'})
food_nutrients_copy.loc[: ,'단백질(g)':'카페인(㎎)'] = food_nutrients_copy.loc[: ,'단백질(g)':'카페인(㎎)'].astype(float)



In [11]:
food_nutrients_copy.loc[: ,'총내용량(g)':'에너지(㎉)'] =\
food_nutrients_copy.loc[: ,'총내용량(g)':'에너지(㎉)'].replace(['-'], 0)

food_nutrients_copy.loc[: ,'총내용량(g)':'에너지(㎉)'] = \
food_nutrients_copy.loc[: ,'총내용량(g)':'에너지(㎉)'].astype(float)

In [12]:
food_nutrients_copy.loc[: ,'수분(g)':'수분(%)'] = food_nutrients_copy.loc[: ,'수분(g)':'수분(%)'].replace(['-', 'tr', 'Tr'], 0)
food_nutrients_copy.loc[: ,'수분(g)':'수분(%)'] = \
food_nutrients_copy.loc[: ,'수분(g)':'수분(%)'].astype(float)

## 3. 영양소 별 데이터 단위 통일

In [13]:
# food_nutrients_copy2 = food_nutrients_copy.copy()

In [14]:
gTomg = 0.001

for col in food_nutrients_copy.loc[: ,'단백질(g)':'카페인(㎎)']:
    if '㎎' in col:
        food_nutrients_copy[col] = food_nutrients_copy[col] * gTomg
for col in food_nutrients_copy.loc[: ,'단백질(g)':'카페인(㎎)']:
    if '㎍' in col:
        food_nutrients_copy[col] = food_nutrients_copy[col] * gTomg * gTomg


In [15]:
food_nutrients_copy.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 49807 entries, 0 to 58596
Columns: 232 entries, NO to 카페인(㎎)
dtypes: float64(225), int64(1), object(6)
memory usage: 88.5+ MB


##### 영향소별 비율을 구하기 위해 데이터를 살펴본 결과 데이터가 복잡.?
ex)아라키돈산, 에이코사펜타에노산 같은 영양소 데이터의 경우 g, mg, %로 나뉘어져 있으며 식품에 따라 표기된 위치가 다르다 다행히 g에도 적혀있고 mg에도 적히는 등 중복으로 된 것은 없어서 통합하면 될 것 같다. % 에 표기된 경우 연산 없이 바로 %값을 사용 -> %값이 있는 데이터의 경우 연산을 진행할 때 제외하고 한다....


In [16]:
def make_nutrientt_list(dataframe, _list, giho):
    for col in dataframe:
        if giho in col:
             _list.append(col)

def make_nutrientt_list_delete_giho(dataframe, _list, giho):
    for col in dataframe:
        if giho in col:
            parentheses = col.find('giho')
            _list.append(col[:parentheses - 2 ])

#
nutrient_persent_list = []     #퍼센트로 표기된 영양소 리스트
nutrient_gram_list = []        #그람으로 표기된 영양소 리스트
nutrient_milligram_list = []   #밀리그람으로 표기된 영양소 리스트
nutrient_microgram_list = []   #마이크로 그람으로 표기된 영양소 리스트

#기호 제거 리스트
_nutrient_persent_list = []
_nutrient_gram_list = []
_nutrient_milligram_list = []
_nutrient_microgram_list = []

fn = food_nutrients_copy.loc[: ,'단백질(g)':'카페인(㎎)']
make_nutrientt_list(fn, nutrient_persent_list, '%')
make_nutrientt_list(fn, nutrient_gram_list, 'g')
make_nutrientt_list(fn, nutrient_milligram_list, '㎎')
make_nutrientt_list(fn, nutrient_microgram_list, '㎍')

make_nutrientt_list_delete_giho(fn, _nutrient_persent_list, '%')
make_nutrientt_list_delete_giho(fn, _nutrient_gram_list, 'g')
make_nutrientt_list_delete_giho(fn, _nutrient_milligram_list, '㎎')
make_nutrientt_list_delete_giho(fn, _nutrient_microgram_list, '㎍')


In [17]:
(food_nutrients_copy[nutrient_persent_list]>0.0).sum()

integrated_G_MG = []
integrated_MG_UG = []

for nutrient in _nutrient_milligram_list:
    if nutrient in _nutrient_gram_list:
        integrated_G_MG.append(nutrient)
    if nutrient in _nutrient_microgram_list:
        integrated_MG_UG.append(nutrient)

have_percent = []
for nutrient in _nutrient_persent_list:
    if nutrient in _nutrient_gram_list:
        have_percent.append(nutrient + '(%)')
    if nutrient in _nutrient_microgram_list:
        have_percent.append(nutrient + '(%)')

print(integrated_G_MG, integrated_MG_UG, have_percent)
food_nutrients_copy.info()

['칼륨', '비타민 C', '콜린', '총 아미노산', '콜레스테롤', '부티르산(4:0)', '카프로산(6:0)', '카프릴산(8:0)', '카프르산(10:0)', '라우르산(12:0)', '미리스트산(14:0)', '팔미트산(16:0)', '스테아르산(18:0)', '아라키드산(20:0)', '미리스톨레산(14:1)', '팔미톨레산(16:1)', '올레산(18:1(n-9))', '박센산(18:1(n-7))', '가돌레산(20:1)', '리놀레산(18:2(n-6)c)', '알파 리놀렌산(18:3(n-3))', '감마 리놀렌산(18:3(n-6))', '에이코사디에노산(20:2(n-6))', '에이코사트리에노산(20:3(n-6))', '아라키돈산(20:4(n-6))', '에이코사펜타에노산(20:5(n-3))', '도코사펜타에노산(22:5(n-3))', '도코사헥사에노산(22:6(n-3))', '트랜스 올레산(18:1(n-9)t)', '트랜스 리놀레산 (18:2t)', '트랜스 리놀렌산(18:3t)'] ['철', '구리', '망간', '비타민 K', '비타민 B1', '비타민 B2', '판토텐산', '비타민 B6', '비타민 B12'] ['총 식이섬유(%)', '총 포화 지방산(%)', '라우르산(12:0)(%)', '미리스트산(14:0)(%)', '팔미트산(16:0)(%)', '스테아르산(18:0)(%)', '아라키드산(20:0)(%)', '총 단일 불포화지방산(%)', '미리스톨레산(14:1)(%)', '팔미톨레산(16:1)(%)', '올레산(18:1(n-9))(%)', '가돌레산(20:1)(%)', '총 다중 불포화지방산(%)', '리놀레산(18:2(n-6)c)(%)', '아라키돈산(20:4(n-6))(%)', '에이코사펜타에노산(20:5(n-3))(%)', '도코사펜타에노산(22:5(n-3))(%)', '도코사헥사에노산(22:6(n-3))(%)', '트랜스 리놀렌산(18:3t)(%)']
<class 'pandas.core.frame.DataFrame'>


#### -단위가 나뉘어서 작성된 영양소 통합 작업-
##### mg의 데이터들은 g으로 옮기고 ug의 데이터들은 mg으로 옮기고 옮긴 colum 삭제

In [18]:
# mg의 데이터들을 g으로 옮겨준다.
for nutrien in integrated_G_MG:
    food_nutrients_copy[nutrien+'(g)'] = food_nutrients_copy[nutrien+'(g)'].add(food_nutrients_copy[nutrien+'(㎎)'])
# ug의 데이터들을 mg으로 옮겨준다.
for nutrien in integrated_MG_UG:
    food_nutrients_copy[nutrien+'(㎎)'] = food_nutrients_copy[nutrien+'(㎎)'].add(food_nutrients_copy[nutrien+'(㎍)'])

In [19]:
food_nutrients_copy.head()

Unnamed: 0,NO,DB군,상용제품,식품명,식품대분류,식품상세분류,1회제공량,내용량_단위,총내용량(g),총내용량(mL),에너지(㎉),수분(g),수분(%),단백질(g),지방(g),지질-가식부 100g당,탄수화물(g),총당류(g),자당(g),포도당(g),과당(g),유당(g),맥아당(g),갈락토오스(g),당알콜(g),에리스리톨(g),총 식이섬유(g),총 식이섬유(mg),총 식이섬유(%),수용성 식이섬유(g),불용성 식이섬유(g),셀룰로오스(%),리그닌(%),칼슘(㎎),철(㎎),철(㎍),마그네슘(㎎),인(㎎),칼륨(g),칼륨(㎎),나트륨(㎎),아연(㎎),구리(㎎),구리(㎍),망간(㎎),망간(㎍),셀레늄(㎍),몰리브덴(㎍),요오드(㎍),염소(㎎),비타민 A(㎍),비타민 A(㎍ RE),레티놀(㎍),베타카로틴(㎍),레티놀A효능,비타민 D(D2+D3)(㎍),비타민 D2(㎍),비타민 D3(㎍),비타민 D1(㎍),비타민 E(㎎),비타민 E(㎎ α-TE),알파 토코페롤(㎎),베타 토코페롤(㎎),감마 토코페롤(㎎),델타 토코페롤(㎎),알파 토코트리에놀(㎎),베타 토코트리에놀(㎎),감마 토코트리에놀(㎎),델타 토코트리에놀(㎎),토코페롤(㎎),토코트리에놀(㎎),비타민 K(㎎),비타민 K(㎍),비타민 K1(㎍),비타민 K2(㎍),비타민 B1(㎎),비타민 B1(㎍),비타민 B2(㎎),비타민 B2(㎍),나이아신(㎎),나이아신(㎎ NE),나이아신(NE)(㎎),나이아신(NE)(㎎ NE),니코틴산 (㎎),니코틴아마이드(㎎),판토텐산(㎎),판토텐산(㎍),비타민 B6(㎎),비타민 B6(㎍),피리독신(㎎),비오틴(㎍),엽산(DFE)(㎍),엽산 - 천연 엽산(㎍),엽산 - 합성 엽산(㎍),비타민 B12(㎎),비타민 B12(㎍),비타민 C(g),비타민 C(㎎),콜린(g),콜린(㎎),총 아미노산(g),총 아미노산(㎎),필수 아미노산(㎎),이소류신(㎎),류신(㎎),라이신(㎎),메티오닌(㎎),페닐알라닌(㎎),트레오닌(㎎),트립토판(㎎),발린(㎎),히스티딘(㎎),아르기닌(㎎),비필수 아미노산(㎎),티로신(㎎),시스테인(㎎),알라닌(㎎),아스파르트산(㎎),글루탐산(㎎),글리신(㎎),프롤린(㎎),세린(㎎),타우린(㎎),글리신 베타인 (㎎),호마린(㎎),트리고넬린(㎎),리보핵산(㎎),데옥시리보핵산(㎎),콜레스테롤(g),콜레스테롤(㎎),총 지방산(g),총 필수 지방산(g),총 포화 지방산(g),총 포화 지방산(%),부티르산(4:0)(g),부티르산(4:0)(㎎),카프로산(6:0)(g),카프로산(6:0)(㎎),카프릴산(8:0)(g),카프릴산(8:0)(㎎),카프르산(10:0)(g),카프르산(10:0)(㎎),라우르산(12:0)(g),라우르산(12:0)(㎎),라우르산(12:0)(%),트라이데칸산(13:0)(㎎),미리스트산(14:0)(g),미리스트산(14:0)(㎎),미리스트산(14:0)(%),펜타데칸산(15:0)(㎎),팔미트산(16:0)(g),팔미트산(16:0)(㎎),팔미트산(16:0)(%),헵타데칸산(17:0)(㎎),스테아르산(18:0)(g),스테아르산(18:0)(㎎),스테아르산(18:0)(%),아라키드산(20:0)(g),아라키드산(20:0)(㎎),아라키드산(20:0)(%),헨에이코산산(21:0)(㎎),베헨산(22:0)(㎎),트리코산산(23:0)(㎎),리그노세르산(24:0)(㎎),총 단일 불포화지방산(g),총 단일 불포화지방산(%),미리스톨레산(14:1)(g),미리스톨레산(14:1)(㎎),미리스톨레산(14:1)(%),팔미톨레산(16:1)(g),팔미톨레산(16:1)(㎎),팔미톨레산(16:1)(%),헵타데센산(17:1)(㎎),올레산(18:1(n-9))(g),올레산(18:1(n-9))(㎎),올레산(18:1(n-9))(%),박센산(18:1(n-7))(g),박센산(18:1(n-7))(㎎),가돌레산(20:1)(g),가돌레산(20:1)(㎎),가돌레산(20:1)(%),에루크산(22:1)(㎎),에루크산(22:1)(%),네르본산(24:1)(㎎),총 다중 불포화지방산(g),총 다중 불포화지방산(%),리놀레산(18:2(n-6)c)(g),리놀레산(18:2(n-6)c)(㎎),리놀레산(18:2(n-6)c)(%),알파 리놀렌산(18:3(n-3))(g),알파 리놀렌산(18:3(n-3))(㎎),리놀렌산(18:3(n-3)(%),감마 리놀렌산(18:3(n-6))(g),감마 리놀렌산(18:3(n-6))(㎎),스테아리돈산(18:4)(%),에이코사디에노산(20:2(n-6))(g),에이코사디에노산(20:2(n-6))(㎎),에이코사트리에노산(20:3(n-3))(㎎),에이코사트리에노산(20:3(n-6))(g),에이코사트리에노산(20:3(n-6))(㎎),아라키돈산(20:4(n-6))(g),아라키돈산(20:4(n-6))(㎎),아라키돈산(20:4(n-6))(%),에이코사테트라에노산(20:4(n-3))(㎎),에이코사펜타에노산(20:5(n-3))(g),에이코사펜타에노산(20:5(n-3))(㎎),에이코사펜타에노산(20:5(n-3))(%),도코사디에노산(22:2)(㎎),도코사펜타에노산(22:5(n-3))(g),도코사펜타에노산(22:5(n-3))(㎎),도코사펜타에노산(22:5(n-3))(%),도코사헥사에노산(22:6(n-3))(g),도코사헥사에노산(22:6(n-3))(㎎),도코사헥사에노산(22:6(n-3))(%),EPA와 DHA의 합(㎎),오메가 3 지방산(g),오메가 6 지방산(g),트랜스 지방산(g),트랜스 올레산(18:1(n-9)t)(g),트랜스 올레산(18:1(n-9)t)(㎎),트랜스 리놀레산 (18:2t)(g),트랜스 리놀레산 (18:2t)(㎎),트랜스 리놀렌산(18:3t)(g),트랜스 리놀렌산(18:3t)(㎎),트랜스 리놀렌산(18:3t)(%),냉산가용성물질(㎎),총 불포화지방산(g),식염상당량(g),회분(g),가식부(%),산가용성물질(%),카페인(㎎)
0,1,음식,품목대표,꿩불고기,구이류,육류구이,500.0,g,0.0,0.0,368.8,412.6,0.0,33.5,8.5,0.0,39.7,16.9,7.2,2.8,2.8,0.7,3.5,0.0,0.0,0.0,9.8,0.0,0.0,0.0,0.0,0.0,0.0,0.10561,4e-06,4e-06,0.08539,0.45805,1.24312,1.24312,1.26431,0.00399,0.00032,0.0,0.00068,0.0,4.8e-05,0.0,0.0,0.0,0.0,0.0,0.0,0.001425,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00873,6e-05,0.0,0.0,0.0,0.0,0.0,0.0,0.00033,0.0,0.00361,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.3e-05,0.0,0.0,0.0,0.0,0.00299,0.00299,0.0,0.0,0.0,0.0,0.0,1.284376,2.328599,2.48475,0.64519,1.274927,1.410841,0.0,1.367688,0.848539,2.205585,0.0,0.919806,0.276499,1.642381,2.781773,4.784606,1.419925,1.092295,1.264958,0.0,0.0,0.0,0.0,0.0,0.0,0.10618,0.10618,0.0,0.0,1.9,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.007115,0.0,0.0,0.0,0.031784,0.0,0.0,0.0,1.283841,0.0,0.0,0.0,0.527395,0.0,0.0,0.029012,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.081352,0.0,0.0,0.0,2.307721,0.0,0.0,0.113463,0.0,0.027976,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.236018,0.0,0.0,0.656723,0.0,0.0,0.018708,0.0,0.0,0.006649,0.0,0.0,0.0,0.0,0.14284,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.023427,0.0,0.0,0.0,0.0,0.0,0.1,0.018116,0.0,0.053416,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.8,0.0,0.0,0.0
1,2,음식,품목대표,닭갈비,구이류,육류구이,400.0,g,0.0,0.0,595.61,276.4,0.0,45.9,25.8,0.0,44.9,21.2,3.6,5.9,4.8,0.0,6.9,0.0,0.0,0.0,11.6,0.0,0.0,0.0,0.0,0.0,0.0,0.09864,3.38e-06,3.38e-06,0.10442,0.50525,1.20024,1.20024,1.53583,0.00355,0.00034,0.0,0.00097,0.0,5.8e-05,0.0,0.0,0.0,0.0,0.0,3.9e-05,0.002133,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00682,4e-05,0.0,0.0,0.0,0.0,0.00024,0.0,0.00037,0.0,0.00123,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000108,0.0,0.0,1e-06,1e-06,0.00554,0.00554,0.0,0.0,0.0,0.0,0.0,1.796242,3.245405,3.593312,0.87804,1.830141,2.019939,0.0,1.966315,1.198582,2.851723,0.0,1.310513,0.30773,2.4652,4.361761,7.778838,2.230079,1.865825,1.833386,0.0,0.0,0.0,0.0,0.0,0.0,0.1934,0.1934,0.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.001698,0.0,0.031794,0.0,0.0,0.0,0.179375,0.0,0.0,0.0,4.484837,0.0,0.0,0.0,1.270946,0.0,0.0,0.031975,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.050503,0.0,0.0,1.290263,0.0,0.0,0.0,8.115577,0.0,0.0,0.464756,0.0,0.082151,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.851294,0.0,0.0,0.443453,0.0,0.0,0.020732,0.0,0.0,0.026682,0.0,0.0,0.040331,0.0,0.127789,0.0,0.0,0.0,0.006143,0.0,0.0,0.0,0.015706,0.0,0.0,0.009782,0.0,0.0,0.0,0.0,0.0,0.2,0.075049,0.0,0.064607,0.0,0.013211,0.0,0.0,0.0,0.0,0.0,7.0,0.0,0.0,0.0
3,4,음식,품목대표,닭꼬치,구이류,육류구이,70.0,g,0.0,0.0,176.722661,35.307907,0.0,11.561723,8.565014,0.0,13.347661,3.152107,0.106114,0.816881,1.639979,0.0,0.589132,0.0,0.0,0.0,2.071708,0.0,0.0,0.0,0.0,0.0,0.0,0.017675,7.636918e-06,7.636918e-06,0.0,0.122798,0.152663,0.152663,0.286911,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.5e-05,4.6e-05,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000226,0.0,0.000184,0.0,0.001713,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.031444,0.031444,0.0,0.0,2.315328,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.0,0.0,1.8,0.0,0.0,0.0,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.4,0.0,0.0,0.0,3.3,0.0,0.0,0.2,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.9,0.0,0.0,0.2,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.043863,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.217695,0.0,0.0,0.0
4,5,음식,품목대표,더덕구이,구이류,채소류구이,100.0,g,0.0,0.0,184.0,58.1,0.0,3.1,5.2,0.0,31.1,11.6,2.2,2.7,1.5,0.0,5.1,0.0,0.0,0.0,6.8,0.0,0.0,0.0,0.0,0.0,0.0,0.04642,1.43e-06,1.43e-06,0.03821,0.08817,0.26244,0.26244,0.74337,0.00059,0.00013,0.0,0.00042,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000481,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00389,0.00147,0.0,0.0,0.0,0.0,0.00023,0.0,8e-05,0.0,0.00018,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.7e-05,0.0,0.0,0.0,0.0,0.00134,0.00134,0.0,0.0,0.0,0.0,0.0,0.06984,0.12653,0.09072,0.01636,0.08278,0.07097,0.0,0.08791,0.04456,0.45703,0.0,0.03386,0.00973,0.09119,0.20315,0.6208,0.08358,0.1172,0.08349,0.0,0.0,0.0,0.0,0.0,0.0,0.00012,0.00012,0.0,0.0,0.8,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5,0.0,0.0,0.0,0.2,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.3,0.0,0.0,0.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.3,0.0,0.0,0.4,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.5,0.0,0.0,0.0
5,6,음식,품목대표,도미구이,구이류,어패류구이,250.0,g,0.0,0.0,397.0,163.3,0.0,61.1,16.5,0.0,2.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.9,0.0,0.0,0.0,0.0,0.0,0.0,0.1588,9.7e-07,9.7e-07,0.12037,0.69091,1.10802,1.10802,1.58217,0.00145,6e-05,0.0,6e-05,0.0,0.000281,0.0,0.0,0.0,0.0,0.0,6.6e-05,2e-06,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00376,0.0,0.0,0.0,0.0,0.0,0.0001,0.0,0.00027,0.0,0.00635,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.8e-05,0.0,0.0,7e-06,7e-06,0.00084,0.00084,0.0,0.0,0.0,0.0,0.0,2.13919,4.27788,4.92098,1.72516,2.22294,2.58386,0.0,2.38848,1.35176,3.92603,0.0,1.95854,0.48177,3.33783,5.70662,8.36183,3.07627,2.06024,2.38206,0.0,0.0,0.0,0.0,0.0,0.0,0.21124,0.21124,0.0,0.0,3.8,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.4,0.0,0.0,0.0,2.5,0.0,0.0,0.0,0.8,0.0,0.0,0.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.6,0.0,0.0,0.0,2.9,0.0,0.0,0.4,0.0,0.2,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.9,0.0,0.0,0.3,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.2,0.0,0.0,0.0,0.6,0.0,0.0,0.0,0.3,0.0,0.0,1.6,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.0,0.0,0.0,0.1,0.0,0.0,0.0,0.0,0.0,7.0,0.0,0.0,0.0


In [20]:
# food_nutrients_copy3 = food_nutrients_copy2.copy()
delete_G_MG = integrated_G_MG[:]
delete_MG_UG = integrated_MG_UG[:]

In [21]:
for i in range(len(integrated_G_MG)):
    delete_G_MG[i] = integrated_G_MG[i] + '(㎎)'

for i in range(len(integrated_MG_UG)):
    delete_MG_UG[i] = integrated_MG_UG[i] + '(㎍)'

food_nutrients_copy = food_nutrients_copy.drop(delete_G_MG, axis = 1)
food_nutrients_copy = food_nutrients_copy.drop(delete_MG_UG, axis = 1)

### %로 표기된 영양소 정제

In [22]:
food_nutrients_copy[(food_nutrients_copy['아라키돈산(20:4(n-6))(g)'] != 0) & (food_nutrients_copy['아라키돈산(20:4(n-6))(%)'] != 0)]

Unnamed: 0,NO,DB군,상용제품,식품명,식품대분류,식품상세분류,1회제공량,내용량_단위,총내용량(g),총내용량(mL),에너지(㎉),수분(g),수분(%),단백질(g),지방(g),지질-가식부 100g당,탄수화물(g),총당류(g),자당(g),포도당(g),과당(g),유당(g),맥아당(g),갈락토오스(g),당알콜(g),에리스리톨(g),총 식이섬유(g),총 식이섬유(mg),총 식이섬유(%),수용성 식이섬유(g),불용성 식이섬유(g),셀룰로오스(%),리그닌(%),칼슘(㎎),철(㎎),마그네슘(㎎),인(㎎),칼륨(g),나트륨(㎎),아연(㎎),구리(㎎),망간(㎎),셀레늄(㎍),몰리브덴(㎍),요오드(㎍),염소(㎎),비타민 A(㎍),비타민 A(㎍ RE),레티놀(㎍),베타카로틴(㎍),레티놀A효능,비타민 D(D2+D3)(㎍),비타민 D2(㎍),비타민 D3(㎍),비타민 D1(㎍),비타민 E(㎎),비타민 E(㎎ α-TE),알파 토코페롤(㎎),베타 토코페롤(㎎),감마 토코페롤(㎎),델타 토코페롤(㎎),알파 토코트리에놀(㎎),베타 토코트리에놀(㎎),감마 토코트리에놀(㎎),델타 토코트리에놀(㎎),토코페롤(㎎),토코트리에놀(㎎),비타민 K(㎎),비타민 K1(㎍),비타민 K2(㎍),비타민 B1(㎎),비타민 B2(㎎),나이아신(㎎),나이아신(㎎ NE),나이아신(NE)(㎎),나이아신(NE)(㎎ NE),니코틴산 (㎎),니코틴아마이드(㎎),판토텐산(㎎),비타민 B6(㎎),피리독신(㎎),비오틴(㎍),엽산(DFE)(㎍),엽산 - 천연 엽산(㎍),엽산 - 합성 엽산(㎍),비타민 B12(㎎),비타민 C(g),콜린(g),총 아미노산(g),필수 아미노산(㎎),이소류신(㎎),류신(㎎),라이신(㎎),메티오닌(㎎),페닐알라닌(㎎),트레오닌(㎎),트립토판(㎎),발린(㎎),히스티딘(㎎),아르기닌(㎎),비필수 아미노산(㎎),티로신(㎎),시스테인(㎎),알라닌(㎎),아스파르트산(㎎),글루탐산(㎎),글리신(㎎),프롤린(㎎),세린(㎎),타우린(㎎),글리신 베타인 (㎎),호마린(㎎),트리고넬린(㎎),리보핵산(㎎),데옥시리보핵산(㎎),콜레스테롤(g),총 지방산(g),총 필수 지방산(g),총 포화 지방산(g),총 포화 지방산(%),부티르산(4:0)(g),카프로산(6:0)(g),카프릴산(8:0)(g),카프르산(10:0)(g),라우르산(12:0)(g),라우르산(12:0)(%),트라이데칸산(13:0)(㎎),미리스트산(14:0)(g),미리스트산(14:0)(%),펜타데칸산(15:0)(㎎),팔미트산(16:0)(g),팔미트산(16:0)(%),헵타데칸산(17:0)(㎎),스테아르산(18:0)(g),스테아르산(18:0)(%),아라키드산(20:0)(g),아라키드산(20:0)(%),헨에이코산산(21:0)(㎎),베헨산(22:0)(㎎),트리코산산(23:0)(㎎),리그노세르산(24:0)(㎎),총 단일 불포화지방산(g),총 단일 불포화지방산(%),미리스톨레산(14:1)(g),미리스톨레산(14:1)(%),팔미톨레산(16:1)(g),팔미톨레산(16:1)(%),헵타데센산(17:1)(㎎),올레산(18:1(n-9))(g),올레산(18:1(n-9))(%),박센산(18:1(n-7))(g),가돌레산(20:1)(g),가돌레산(20:1)(%),에루크산(22:1)(㎎),에루크산(22:1)(%),네르본산(24:1)(㎎),총 다중 불포화지방산(g),총 다중 불포화지방산(%),리놀레산(18:2(n-6)c)(g),리놀레산(18:2(n-6)c)(%),알파 리놀렌산(18:3(n-3))(g),리놀렌산(18:3(n-3)(%),감마 리놀렌산(18:3(n-6))(g),스테아리돈산(18:4)(%),에이코사디에노산(20:2(n-6))(g),에이코사트리에노산(20:3(n-3))(㎎),에이코사트리에노산(20:3(n-6))(g),아라키돈산(20:4(n-6))(g),아라키돈산(20:4(n-6))(%),에이코사테트라에노산(20:4(n-3))(㎎),에이코사펜타에노산(20:5(n-3))(g),에이코사펜타에노산(20:5(n-3))(%),도코사디에노산(22:2)(㎎),도코사펜타에노산(22:5(n-3))(g),도코사펜타에노산(22:5(n-3))(%),도코사헥사에노산(22:6(n-3))(g),도코사헥사에노산(22:6(n-3))(%),EPA와 DHA의 합(㎎),오메가 3 지방산(g),오메가 6 지방산(g),트랜스 지방산(g),트랜스 올레산(18:1(n-9)t)(g),트랜스 리놀레산 (18:2t)(g),트랜스 리놀렌산(18:3t)(g),트랜스 리놀렌산(18:3t)(%),냉산가용성물질(㎎),총 불포화지방산(g),식염상당량(g),회분(g),가식부(%),산가용성물질(%),카페인(㎎)


In [23]:
food_nutrients_copy1 = food_nutrients_copy.copy()

In [24]:
food_nutrients_copy1.reset_index(drop=True, inplace=True)

In [25]:
# for i in range(1, len(food_nutrients_copy1.index)):
#     if food_nutrients_copy1.loc[i, '총 포화 지방산(g)'] == 0:
#         food_nutrients_copy1.loc[i, '총 포화 지방산(g)'] = \
#             food_nutrients_copy1.loc[i, '총 포화 지방산(%)'] * food_nutrients_copy1.loc[i, '1회제공량']/100


In [26]:
# for i in range(1, len(food_nutrients_copy1.index)):
#     if food_nutrients_copy1.loc[i, '라우르산(12:0)(g)'] == 0:
#         food_nutrients_copy1.loc[i, '라우르산(12:0)(g)'] = \
#             food_nutrients_copy1.loc[i, '라우르산(12:0)(%)'] * food_nutrients_copy1.loc[i, '1회제공량']/100

In [27]:
for name in have_percent:
    name = name[:-3]
    for i in range(1, len(food_nutrients_copy1.index)):
        if food_nutrients_copy1.loc[i, name + '(g)'] == 0:
            food_nutrients_copy1.loc[i, name+ '(g)'] = \
                food_nutrients_copy1.loc[i, name + '(%)'] * food_nutrients_copy1.loc[i, '1회제공량'] / 100

In [28]:
# for col in food_nutrients_copy3.loc[: ,'단백질(g)':'카페인(㎎)']:
#     if col not in nutrient_persent_list:
#         food_nutrients_copy3[col] = food_nutrients_copy3[col] / food_nutrients_copy3['1회제공량'] *100

# food_nutrients_copy3.head()

'''데이터 통일성 부족;;;;;
어떤 식품은 1회제공량을 기준으로 영양소 량을 기록한게 있다면
어떤 식품은 총내용량을 기준으로 영양소 량을 기록한게 있다
1회 제공량 기준으로 비율을 구하면 값이 6000이상이 나오는 등 결치값 발생
각 식품별 영양소 비율을 구하는것은 포기.....
그냥 식품별 최대값을 구하고 그 최대값이 어떤 영양소인지만 구한다.
'''

'데이터 통일성 부족;;;;;\n어떤 식품은 1회제공량을 기준으로 영양소 량을 기록한게 있다면\n어떤 식품은 총내용량을 기준으로 영양소 량을 기록한게 있다\n1회 제공량 기준으로 비율을 구하면 값이 6000이상이 나오는 등 결치값 발생\n각 식품별 영양소 비율을 구하는것은 포기.....\n그냥 식품별 최대값을 구하고 그 최대값이 어떤 영양소인지만 구한다.\n'

In [29]:
# food_nutrients_copy3.to_excel('통합 식품영양성분DB_정리본.xlsx')

In [30]:
food_nutrients_copy1.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 49807 entries, 0 to 49806
Columns: 192 entries, NO to 카페인(㎎)
dtypes: float64(185), int64(1), object(6)
memory usage: 73.0+ MB


In [31]:
pd.set_option('display.max_seq_items', None)
food_nutrients_copy1.columns

Index(['NO', 'DB군', '상용제품', '식품명', '식품대분류', '식품상세분류', '1회제공량', '내용량_단위',
       '총내용량(g)', '총내용량(mL)', '에너지(㎉)', '수분(g)', '수분(%)', '단백질(g)', '지방(g)',
       '지질-가식부 100g당', '탄수화물(g)', '총당류(g)', '자당(g)', '포도당(g)', '과당(g)',
       '유당(g)', '맥아당(g)', '갈락토오스(g)', '당알콜(g)', '에리스리톨(g)', '총 식이섬유(g)',
       '총 식이섬유(mg)', '총 식이섬유(%)', '수용성 식이섬유(g)', '불용성 식이섬유(g)', '셀룰로오스(%)',
       '리그닌(%)', '칼슘(㎎)', '철(㎎)', '마그네슘(㎎)', '인(㎎)', '칼륨(g)', '나트륨(㎎)',
       '아연(㎎)', '구리(㎎)', '망간(㎎)', '셀레늄(㎍)', '몰리브덴(㎍)', '요오드(㎍)', '염소(㎎)',
       '비타민 A(㎍)', '비타민 A(㎍ RE)', '레티놀(㎍)', '베타카로틴(㎍)', '레티놀A효능',
       '비타민 D(D2+D3)(㎍)', '비타민 D2(㎍)', '비타민 D3(㎍)', '비타민 D1(㎍)', '비타민 E(㎎)',
       '비타민 E(㎎ α-TE)', '알파 토코페롤(㎎)', '베타 토코페롤(㎎)', '감마 토코페롤(㎎)', '델타 토코페롤(㎎)',
       '알파 토코트리에놀(㎎)', '베타 토코트리에놀(㎎)', '감마 토코트리에놀(㎎)', '델타 토코트리에놀(㎎)',
       '토코페롤(㎎)', '토코트리에놀(㎎)', '비타민 K(㎎)', '비타민 K1(㎍)', '비타민 K2(㎍)',
       '비타민 B1(㎎)', '비타민 B2(㎎)', '나이아신(㎎)', '나이아신(㎎ NE)', '나이아신(NE)(㎎)',
       '나이아신(NE)(㎎ NE)', '니코틴산 (㎎)', '니코틴아마이드(㎎

##### 컬럼에서 단위 제거

In [32]:
food_nutrients_copy1.columns = ['NO', 'DB군', '상용제품', '식품명', '식품대분류', '식품상세분류', '1회제공량', '단위',
       '총내용량(g)', '총내용량(mL)', '에너지', '수분', '수분(%)', '단백질',
       '지방', '지질-가식부 100g당', '탄수화물', '총당류', '자당', '포도당',
       '과당', '유당', '맥아당', '갈락토오스', '당알콜', '에리스리톨',
       '총 식이섬유', '총 식이섬유', '총 식이섬유(%)', '수용성 식이섬유', '불용성 식이섬유',
       '셀룰로오스(%)', '리그닌(%)', '칼슘', '철', '마그네슘', '인', '칼륨',
       '나트륨', '아연', '구리', '망간', '셀레늄', '몰리브덴', '요오드',
       '염소', '비타민 A', '비타민 A(RE)', '레티놀', '베타카로틴', '레티놀A효능',
       '비타민 D(D2+D3)', '비타민 D2', '비타민 D3', '비타민 D1', '비타민 E',
       '비타민 E(α-TE)', '알파 토코페롤', '베타 토코페롤', '감마 토코페롤', '델타 토코페롤',
       '알파 토코트리에놀', '베타 토코트리에놀', '감마 토코트리에놀', '델타 토코트리에놀',
       '토코페롤', '토코트리에놀', '비타민 K', '비타민 K1', '비타민 K2',
       '비타민 B1', '비타민 B2', '나이아신', '나이아신(NE)', '나이아신(NE))',
       '나이아신(NE)(NE)', '니코틴산', '니코틴아마이드', '판토텐산', '비타민 B6',
       '피리독신', '비오틴', '엽산(DFE)', '엽산 - 천연 엽산', '엽산 - 합성 엽산',
       '비타민 B12', '비타민 C', '콜린', '총 아미노산', '필수 아미노산', '이소류신',
       '류신', '라이신', '메티오닌', '페닐알라닌', '트레오닌', '트립토판', '발린',
       '히스티딘', '아르기닌', '비필수 아미노산', '티로신', '시스테인', '알라닌',
       '아스파르트산', '글루탐산', '글리신', '프롤린', '세린', '타우린',
       '글리신 베타인 ', '호마린', '트리고넬린', '리보핵산', '데옥시리보핵산',
       '콜레스테롤', '총 지방산', '총 필수 지방산', '총 포화 지방산', '총 포화 지방산(%)',
       '부티르산(4:0)', '카프로산(6:0)', '카프릴산(8:0)', '카프르산(10:0)',
       '라우르산(12:0)', '라우르산(12:0)(%)', '트라이데칸산(13:0)', '미리스트산(14:0)',
       '미리스트산(14:0)(%)', '펜타데칸산(15:0)', '팔미트산(16:0)', '팔미트산(16:0)(%)',
       '헵타데칸산(17:0)', '스테아르산(18:0)', '스테아르산(18:0)(%)', '아라키드산(20:0)',
       '아라키드산(20:0)(%)', '헨에이코산산(21:0)', '베헨산(22:0)', '트리코산산(23:0)',
       '리그노세르산(24:0)', '총 단일 불포화지방산', '총 단일 불포화지방산(%)',
       '미리스톨레산(14:1)', '미리스톨레산(14:1)(%)', '팔미톨레산(16:1)',
       '팔미톨레산(16:1)(%)', '헵타데센산(17:1)', '올레산(18:1(n-9))',
       '올레산(18:1(n-9))(%)', '박센산(18:1(n-7))', '가돌레산(20:1)',
       '가돌레산(20:1)(%)', '에루크산(22:1)', '에루크산(22:1)(%)', '네르본산(24:1)',
       '총 다중 불포화지방산', '총 다중 불포화지방산(%)', '리놀레산(18:2(n-6)c)',
       '리놀레산(18:2(n-6)c)(%)', '알파 리놀렌산(18:3(n-3))', '리놀렌산(18:3(n-3)(%)',
       '감마 리놀렌산(18:3(n-6))', '스테아리돈산(18:4)(%)', '에이코사디에노산(20:2(n-6))',
       '에이코사트리에노산(20:3(n-3))', '에이코사트리에노산(20:3(n-6))',
       '아라키돈산(20:4(n-6))', '아라키돈산(20:4(n-6))(%)',
       '에이코사테트라에노산(20:4(n-3))', '에이코사펜타에노산(20:5(n-3))',
       '에이코사펜타에노산(20:5(n-3))(%)', '도코사디에노산(22:2)', '도코사펜타에노산(22:5(n-3))',
       '도코사펜타에노산(22:5(n-3))(%)', '도코사헥사에노산(22:6(n-3))',
       '도코사헥사에노산(22:6(n-3))(%)', 'EPA와 DHA의 합', '오메가 3 지방산',
       '오메가 6 지방산', '트랜스 지방산', '트랜스 올레산(18:1(n-9)t)',
       '트랜스 리놀레산 (18:2t)', '트랜스 리놀렌산(18:3t)', '트랜스 리놀렌산(18:3t)(%)',
       '냉산가용성물질', '총 불포화지방산', '식염상당량', '회분', '가식부(%)', '산가용성물질(%)',
       '카페인']


### %로 표기된 영양소 column 제거

In [33]:
food_nutrients_copy1 = food_nutrients_copy1.loc[:, ['NO', 'DB군', '상용제품', '식품명', '식품대분류', '식품상세분류', '1회제공량', '단위',
       '총내용량(g)', '총내용량(mL)', '에너지', '수분', '단백질',
       '지방', '탄수화물', '총당류', '자당', '포도당',
       '과당', '유당', '맥아당', '갈락토오스', '당알콜', '에리스리톨',
       '총 식이섬유', '수용성 식이섬유', '불용성 식이섬유',
       '칼슘', '철', '마그네슘', '인', '칼륨',
       '나트륨', '아연', '구리', '망간', '셀레늄', '몰리브덴', '요오드',
       '염소', '비타민 A', '비타민 A(RE)', '레티놀', '베타카로틴', '레티놀A효능',
       '비타민 D(D2+D3)', '비타민 D2', '비타민 D3', '비타민 D1', '비타민 E',
       '비타민 E(α-TE)', '알파 토코페롤', '베타 토코페롤', '감마 토코페롤', '델타 토코페롤',
       '알파 토코트리에놀', '베타 토코트리에놀', '감마 토코트리에놀', '델타 토코트리에놀',
       '토코페롤', '토코트리에놀', '비타민 K', '비타민 K1', '비타민 K2',
       '비타민 B1', '비타민 B2', '나이아신', '나이아신(NE)', '나이아신(NE))',
       '나이아신(NE)(NE)', '니코틴산', '니코틴아마이드', '판토텐산', '비타민 B6',
       '피리독신', '비오틴', '엽산(DFE)', '엽산 - 천연 엽산', '엽산 - 합성 엽산',
       '비타민 B12', '비타민 C', '콜린', '총 아미노산', '필수 아미노산', '이소류신',
       '류신', '라이신', '메티오닌', '페닐알라닌', '트레오닌', '트립토판', '발린',
       '히스티딘', '아르기닌', '비필수 아미노산', '티로신', '시스테인', '알라닌',
       '아스파르트산', '글루탐산', '글리신', '프롤린', '세린', '타우린',
       '글리신 베타인 ', '호마린', '트리고넬린', '리보핵산', '데옥시리보핵산',
       '콜레스테롤', '총 지방산', '총 필수 지방산', '총 포화 지방산',
       '부티르산(4:0)', '카프로산(6:0)', '카프릴산(8:0)', '카프르산(10:0)',
       '라우르산(12:0)', '트라이데칸산(13:0)', '미리스트산(14:0)',
       '펜타데칸산(15:0)', '팔미트산(16:0)',
       '헵타데칸산(17:0)', '스테아르산(18:0)', '아라키드산(20:0)',
       '헨에이코산산(21:0)', '베헨산(22:0)', '트리코산산(23:0)',
       '리그노세르산(24:0)', '총 단일 불포화지방산',
       '미리스톨레산(14:1)', '팔미톨레산(16:1)',
       '헵타데센산(17:1)', '올레산(18:1(n-9))',
       '박센산(18:1(n-7))', '가돌레산(20:1)',
       '에루크산(22:1)', '네르본산(24:1)',
       '총 다중 불포화지방산', '리놀레산(18:2(n-6)c)',
       '알파 리놀렌산(18:3(n-3))',
       '감마 리놀렌산(18:3(n-6))', '에이코사디에노산(20:2(n-6))',
       '에이코사트리에노산(20:3(n-3))', '에이코사트리에노산(20:3(n-6))',
       '아라키돈산(20:4(n-6))',
       '에이코사테트라에노산(20:4(n-3))', '에이코사펜타에노산(20:5(n-3))',
       '도코사디에노산(22:2)', '도코사펜타에노산(22:5(n-3))',
       '도코사헥사에노산(22:6(n-3))',
       'EPA와 DHA의 합', '오메가 3 지방산',
       '오메가 6 지방산', '트랜스 지방산', '트랜스 올레산(18:1(n-9)t)',
       '트랜스 리놀레산 (18:2t)', '트랜스 리놀렌산(18:3t)',
       '냉산가용성물질', '총 불포화지방산', '식염상당량', '회분',
       '카페인']]


In [34]:
food_nutrients_copy1.columns

Index(['NO', 'DB군', '상용제품', '식품명', '식품대분류', '식품상세분류', '1회제공량', '단위', '총내용량(g)',
       '총내용량(mL)', '에너지', '수분', '단백질', '지방', '탄수화물', '총당류', '자당', '포도당', '과당',
       '유당', '맥아당', '갈락토오스', '당알콜', '에리스리톨', '총 식이섬유', '총 식이섬유', '수용성 식이섬유',
       '불용성 식이섬유', '칼슘', '철', '마그네슘', '인', '칼륨', '나트륨', '아연', '구리', '망간',
       '셀레늄', '몰리브덴', '요오드', '염소', '비타민 A', '비타민 A(RE)', '레티놀', '베타카로틴',
       '레티놀A효능', '비타민 D(D2+D3)', '비타민 D2', '비타민 D3', '비타민 D1', '비타민 E',
       '비타민 E(α-TE)', '알파 토코페롤', '베타 토코페롤', '감마 토코페롤', '델타 토코페롤', '알파 토코트리에놀',
       '베타 토코트리에놀', '감마 토코트리에놀', '델타 토코트리에놀', '토코페롤', '토코트리에놀', '비타민 K',
       '비타민 K1', '비타민 K2', '비타민 B1', '비타민 B2', '나이아신', '나이아신(NE)', '나이아신(NE))',
       '나이아신(NE)(NE)', '니코틴산', '니코틴아마이드', '판토텐산', '비타민 B6', '피리독신', '비오틴',
       '엽산(DFE)', '엽산 - 천연 엽산', '엽산 - 합성 엽산', '비타민 B12', '비타민 C', '콜린',
       '총 아미노산', '필수 아미노산', '이소류신', '류신', '라이신', '메티오닌', '페닐알라닌', '트레오닌',
       '트립토판', '발린', '히스티딘', '아르기닌', '비필수 아미노산', '티로신', '시스테인', '알라닌',
       '아스파르트산', '글루탐

#### 나이아신 영양소 정제 

In [35]:
# food_nutrients_copy1[['나이아신', '나이아신(NE)', '나이아신(NE))','나이아신(NE)(NE)']]

food_nutrients_copy1['나이아신'] = food_nutrients_copy1['나이아신'].add(food_nutrients_copy1['나이아신(NE)'])
food_nutrients_copy1['나이아신(NE))'] = food_nutrients_copy1['나이아신(NE))'].add(food_nutrients_copy1['나이아신(NE)(NE)'])


In [36]:
food_nutrients_copy1 = food_nutrients_copy1.drop(['나이아신(NE)', '나이아신(NE)(NE)'], axis=1)

In [37]:
pd.set_option('display.max_rows', 200)
# food_nutrients_copy1 = food_nutrients_copy1.sort_values(['1회제공량', 'NO'], ascending=False)
# food_nutrients_copy4.head(50)

In [38]:
food_nutrients_copy.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 49807 entries, 0 to 58596
Columns: 192 entries, NO to 카페인(㎎)
dtypes: float64(185), int64(1), object(6)
memory usage: 73.3+ MB


In [39]:
#1회제공량>=3000 & 단위 g인 row 모두 제거

food_nutrients_copy1 = food_nutrients_copy1[(food_nutrients_copy1['단위']=='mL')| ((food_nutrients_copy1['1회제공량']<=3000) & (food_nutrients_copy1['단위']=='g'))]
# food_nutrients_copy1.head()

In [40]:
food_nutrients_copy1.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 49068 entries, 0 to 49806
Columns: 162 entries, NO to 카페인
dtypes: float64(155), int64(1), object(6)
memory usage: 61.0+ MB


In [41]:
print((food_nutrients_copy['1회제공량'] == food_nutrients_copy['총내용량(mL)']).sum())
print((food_nutrients_copy['총내용량(mL)']>0.0).sum())
print((food_nutrients_copy['1회제공량'] == food_nutrients_copy['총내용량(g)']).sum())
print((food_nutrients_copy['총내용량(g)']>0.0).sum())

(food_nutrients_copy['1회제공량'] != food_nutrients_copy['총내용량(mL)']).sum()

3834
6534
15324
29899


45973

### 총내용량(g)과 총내용량(mL) column을 list로 뽑아서 합침

In [42]:
tmp_1 = food_nutrients_copy1['총내용량(g)'].tolist()
tmp_2 = food_nutrients_copy1['총내용량(mL)'].tolist()
tmp_3 = []

for i in range(len(tmp_1)):
    if tmp_1[i] == 0:
        tmp_3.append(tmp_2[i])
    else:
        tmp_3.append(tmp_1[i])

In [43]:
food_nutrients_copy1 = food_nutrients_copy1.drop(['총내용량(g)', '총내용량(mL)'], axis=1)

In [44]:
food_nutrients_copy1['총내용량'] = tmp_3

In [45]:
food_nutrients_copy1.columns

Index(['NO', 'DB군', '상용제품', '식품명', '식품대분류', '식품상세분류', '1회제공량', '단위', '에너지',
       '수분', '단백질', '지방', '탄수화물', '총당류', '자당', '포도당', '과당', '유당', '맥아당',
       '갈락토오스', '당알콜', '에리스리톨', '총 식이섬유', '총 식이섬유', '수용성 식이섬유', '불용성 식이섬유',
       '칼슘', '철', '마그네슘', '인', '칼륨', '나트륨', '아연', '구리', '망간', '셀레늄', '몰리브덴',
       '요오드', '염소', '비타민 A', '비타민 A(RE)', '레티놀', '베타카로틴', '레티놀A효능',
       '비타민 D(D2+D3)', '비타민 D2', '비타민 D3', '비타민 D1', '비타민 E', '비타민 E(α-TE)',
       '알파 토코페롤', '베타 토코페롤', '감마 토코페롤', '델타 토코페롤', '알파 토코트리에놀', '베타 토코트리에놀',
       '감마 토코트리에놀', '델타 토코트리에놀', '토코페롤', '토코트리에놀', '비타민 K', '비타민 K1', '비타민 K2',
       '비타민 B1', '비타민 B2', '나이아신', '나이아신(NE))', '니코틴산', '니코틴아마이드', '판토텐산',
       '비타민 B6', '피리독신', '비오틴', '엽산(DFE)', '엽산 - 천연 엽산', '엽산 - 합성 엽산',
       '비타민 B12', '비타민 C', '콜린', '총 아미노산', '필수 아미노산', '이소류신', '류신', '라이신',
       '메티오닌', '페닐알라닌', '트레오닌', '트립토판', '발린', '히스티딘', '아르기닌', '비필수 아미노산',
       '티로신', '시스테인', '알라닌', '아스파르트산', '글루탐산', '글리신', '프롤린', '세린', '타우린',
       '글리신 베타인 ', '호마린', '

#### 총 내용량 위치 수정

In [46]:
food_nutrients_copy1 = food_nutrients_copy1.loc[:, ['NO', 'DB군', '상용제품', '식품명', '식품대분류', '식품상세분류', '1회제공량', '단위',
       '총내용량', '에너지', '수분', '단백질',
       '지방', '탄수화물', '총당류', '자당', '포도당',
       '과당', '유당', '맥아당', '갈락토오스', '당알콜', '에리스리톨',
       '총 식이섬유', '수용성 식이섬유', '불용성 식이섬유',
       '칼슘', '철', '마그네슘', '인', '칼륨',
       '나트륨', '아연', '구리', '망간', '셀레늄', '몰리브덴', '요오드',
       '염소', '비타민 A', '비타민 A(RE)', '레티놀', '베타카로틴', '레티놀A효능',
       '비타민 D(D2+D3)', '비타민 D2', '비타민 D3', '비타민 D1', '비타민 E',
       '비타민 E(α-TE)', '알파 토코페롤', '베타 토코페롤', '감마 토코페롤', '델타 토코페롤',
       '알파 토코트리에놀', '베타 토코트리에놀', '감마 토코트리에놀', '델타 토코트리에놀',
       '토코페롤', '토코트리에놀', '비타민 K', '비타민 K1', '비타민 K2',
       '비타민 B1', '비타민 B2', '나이아신', '나이아신(NE))', '니코틴산', '니코틴아마이드', '판토텐산', '비타민 B6',
       '피리독신', '비오틴', '엽산(DFE)', '엽산 - 천연 엽산', '엽산 - 합성 엽산',
       '비타민 B12', '비타민 C', '콜린', '총 아미노산', '필수 아미노산', '이소류신',
       '류신', '라이신', '메티오닌', '페닐알라닌', '트레오닌', '트립토판', '발린',
       '히스티딘', '아르기닌', '비필수 아미노산', '티로신', '시스테인', '알라닌',
       '아스파르트산', '글루탐산', '글리신', '프롤린', '세린', '타우린',
       '글리신 베타인 ', '호마린', '트리고넬린', '리보핵산', '데옥시리보핵산',
       '콜레스테롤', '총 지방산', '총 필수 지방산', '총 포화 지방산',
       '부티르산(4:0)', '카프로산(6:0)', '카프릴산(8:0)', '카프르산(10:0)',
       '라우르산(12:0)', '트라이데칸산(13:0)', '미리스트산(14:0)',
       '펜타데칸산(15:0)', '팔미트산(16:0)',
       '헵타데칸산(17:0)', '스테아르산(18:0)', '아라키드산(20:0)',
       '헨에이코산산(21:0)', '베헨산(22:0)', '트리코산산(23:0)',
       '리그노세르산(24:0)', '총 단일 불포화지방산',
       '미리스톨레산(14:1)', '팔미톨레산(16:1)',
       '헵타데센산(17:1)', '올레산(18:1(n-9))',
       '박센산(18:1(n-7))', '가돌레산(20:1)',
       '에루크산(22:1)', '네르본산(24:1)',
       '총 다중 불포화지방산', '리놀레산(18:2(n-6)c)',
       '알파 리놀렌산(18:3(n-3))',
       '감마 리놀렌산(18:3(n-6))', '에이코사디에노산(20:2(n-6))',
       '에이코사트리에노산(20:3(n-3))', '에이코사트리에노산(20:3(n-6))',
       '아라키돈산(20:4(n-6))',
       '에이코사테트라에노산(20:4(n-3))', '에이코사펜타에노산(20:5(n-3))',
       '도코사디에노산(22:2)', '도코사펜타에노산(22:5(n-3))',
       '도코사헥사에노산(22:6(n-3))',
       'EPA와 DHA의 합', '오메가 3 지방산',
       '오메가 6 지방산', '트랜스 지방산', '트랜스 올레산(18:1(n-9)t)',
       '트랜스 리놀레산 (18:2t)', '트랜스 리놀렌산(18:3t)',
       '냉산가용성물질', '총 불포화지방산', '식염상당량', '회분',
       '카페인']]

In [47]:
#index reset
food_nutrients_copy1.reset_index(level=0)
food_nutrients_copy1.reset_index(drop=True)

Unnamed: 0,NO,DB군,상용제품,식품명,식품대분류,식품상세분류,1회제공량,단위,총내용량,에너지,수분,단백질,지방,탄수화물,총당류,자당,포도당,과당,유당,맥아당,갈락토오스,당알콜,에리스리톨,총 식이섬유,총 식이섬유.1,수용성 식이섬유,불용성 식이섬유,칼슘,철,마그네슘,인,칼륨,나트륨,아연,구리,망간,셀레늄,몰리브덴,요오드,염소,비타민 A,비타민 A(RE),레티놀,베타카로틴,레티놀A효능,비타민 D(D2+D3),비타민 D2,비타민 D3,비타민 D1,비타민 E,비타민 E(α-TE),알파 토코페롤,베타 토코페롤,감마 토코페롤,델타 토코페롤,알파 토코트리에놀,베타 토코트리에놀,감마 토코트리에놀,델타 토코트리에놀,토코페롤,토코트리에놀,비타민 K,비타민 K1,비타민 K2,비타민 B1,비타민 B2,나이아신,나이아신(NE)),니코틴산,니코틴아마이드,판토텐산,비타민 B6,피리독신,비오틴,엽산(DFE),엽산 - 천연 엽산,엽산 - 합성 엽산,비타민 B12,비타민 C,콜린,총 아미노산,필수 아미노산,이소류신,류신,라이신,메티오닌,페닐알라닌,트레오닌,트립토판,발린,히스티딘,아르기닌,비필수 아미노산,티로신,시스테인,알라닌,아스파르트산,글루탐산,글리신,프롤린,세린,타우린,글리신 베타인,호마린,트리고넬린,리보핵산,데옥시리보핵산,콜레스테롤,총 지방산,총 필수 지방산,총 포화 지방산,부티르산(4:0),카프로산(6:0),카프릴산(8:0),카프르산(10:0),라우르산(12:0),트라이데칸산(13:0),미리스트산(14:0),펜타데칸산(15:0),팔미트산(16:0),헵타데칸산(17:0),스테아르산(18:0),아라키드산(20:0),헨에이코산산(21:0),베헨산(22:0),트리코산산(23:0),리그노세르산(24:0),총 단일 불포화지방산,미리스톨레산(14:1),팔미톨레산(16:1),헵타데센산(17:1),올레산(18:1(n-9)),박센산(18:1(n-7)),가돌레산(20:1),에루크산(22:1),네르본산(24:1),총 다중 불포화지방산,리놀레산(18:2(n-6)c),알파 리놀렌산(18:3(n-3)),감마 리놀렌산(18:3(n-6)),에이코사디에노산(20:2(n-6)),에이코사트리에노산(20:3(n-3)),에이코사트리에노산(20:3(n-6)),아라키돈산(20:4(n-6)),에이코사테트라에노산(20:4(n-3)),에이코사펜타에노산(20:5(n-3)),도코사디에노산(22:2),도코사펜타에노산(22:5(n-3)),도코사헥사에노산(22:6(n-3)),EPA와 DHA의 합,오메가 3 지방산,오메가 6 지방산,트랜스 지방산,트랜스 올레산(18:1(n-9)t),트랜스 리놀레산 (18:2t),트랜스 리놀렌산(18:3t),냉산가용성물질,총 불포화지방산,식염상당량,회분,카페인
0,1,음식,품목대표,꿩불고기,구이류,육류구이,500.0,g,0.0,368.800000,412.600000,33.500000,8.500000,39.700000,16.900000,7.200000,2.800000,2.800000,0.7,3.500000,0.0,0.0,0.0,9.800000,0.0,0.0,0.0,0.105610,4.000000e-06,0.08539,0.458050,1.243120,1.264310,0.00399,0.00032,0.00068,0.000048,0.0,0.0,0.0,0.0,0.0,0.000000,0.001425,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00873,0.00006,0.0,0.0,0.0,0.000000,0.000330,0.003610,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000063,0.0,0.0,0.000000,0.00299,0.0,0.0,0.0,1.284376,2.328599,2.484750,0.64519,1.274927,1.410841,0.0,1.367688,0.848539,2.205585,0.0,0.919806,0.276499,1.642381,2.781773,4.784606,1.419925,1.092295,1.264958,0.0,0.0,0.0,0.0,0.0,0.0,0.106180,0.0,0.0,1.900000,0.0,0.0,0.0,0.000000,0.007115,0.0,0.031784,0.0,1.283841,0.0,0.527395,0.029012,0.0,0.0,0.0,0.0,0.0,0.000000,0.081352,0.0,2.307721,0.113463,0.027976,0.0,0.0,0.0,3.236018,0.656723,0.018708,0.006649,0.0,0.000000,0.142840,0.0,0.000000,0.0,0.000000,0.023427,0.0,0.0,0.0,0.100000,0.018116,0.053416,0.000000,0.0,0.0,0.0,5.800000,0.0
1,2,음식,품목대표,닭갈비,구이류,육류구이,400.0,g,0.0,595.610000,276.400000,45.900000,25.800000,44.900000,21.200000,3.600000,5.900000,4.800000,0.0,6.900000,0.0,0.0,0.0,11.600000,0.0,0.0,0.0,0.098640,3.380000e-06,0.10442,0.505250,1.200240,1.535830,0.00355,0.00034,0.00097,0.000058,0.0,0.0,0.0,0.0,0.0,0.000039,0.002133,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00682,0.00004,0.0,0.0,0.0,0.000240,0.000370,0.001230,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000108,0.0,0.0,0.000001,0.00554,0.0,0.0,0.0,1.796242,3.245405,3.593312,0.87804,1.830141,2.019939,0.0,1.966315,1.198582,2.851723,0.0,1.310513,0.307730,2.465200,4.361761,7.778838,2.230079,1.865825,1.833386,0.0,0.0,0.0,0.0,0.0,0.0,0.193400,0.0,0.0,6.000000,0.0,0.0,0.0,0.001698,0.031794,0.0,0.179375,0.0,4.484837,0.0,1.270946,0.031975,0.0,0.0,0.0,0.0,0.0,0.050503,1.290263,0.0,8.115577,0.464756,0.082151,0.0,0.0,0.0,4.851294,0.443453,0.020732,0.026682,0.0,0.040331,0.127789,0.0,0.006143,0.0,0.015706,0.009782,0.0,0.0,0.0,0.200000,0.075049,0.064607,0.013211,0.0,0.0,0.0,7.000000,0.0
2,4,음식,품목대표,닭꼬치,구이류,육류구이,70.0,g,0.0,176.722661,35.307907,11.561723,8.565014,13.347661,3.152107,0.106114,0.816881,1.639979,0.0,0.589132,0.0,0.0,0.0,2.071708,0.0,0.0,0.0,0.017675,7.636918e-06,0.00000,0.122798,0.152663,0.286911,0.00000,0.00000,0.00000,0.000000,0.0,0.0,0.0,0.0,0.0,0.000015,0.000046,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00000,0.00000,0.0,0.0,0.0,0.000226,0.000184,0.001713,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.000000,0.00000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.00000,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.031444,0.0,0.0,2.315328,0.0,0.0,0.0,0.000000,0.000000,0.0,0.100000,0.0,1.800000,0.0,0.500000,0.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.400000,0.0,3.300000,0.200000,0.000000,0.0,0.0,0.0,1.900000,0.200000,0.000000,0.000000,0.0,0.000000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.043863,0.000000,0.000000,0.000000,0.0,0.0,0.0,1.217695,0.0
3,5,음식,품목대표,더덕구이,구이류,채소류구이,100.0,g,0.0,184.000000,58.100000,3.100000,5.200000,31.100000,11.600000,2.200000,2.700000,1.500000,0.0,5.100000,0.0,0.0,0.0,6.800000,0.0,0.0,0.0,0.046420,1.430000e-06,0.03821,0.088170,0.262440,0.743370,0.00059,0.00013,0.00042,0.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.000481,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00389,0.00147,0.0,0.0,0.0,0.000230,0.000080,0.000180,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000017,0.0,0.0,0.000000,0.00134,0.0,0.0,0.0,0.069840,0.126530,0.090720,0.01636,0.082780,0.070970,0.0,0.087910,0.044560,0.457030,0.0,0.033860,0.009730,0.091190,0.203150,0.620800,0.083580,0.117200,0.083490,0.0,0.0,0.0,0.0,0.0,0.0,0.000120,0.0,0.0,0.800000,0.0,0.0,0.0,0.000000,0.000000,0.0,0.000000,0.0,0.500000,0.0,0.200000,0.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.000000,0.0,1.300000,0.100000,0.000000,0.0,0.0,0.0,2.300000,0.400000,0.000000,0.000000,0.0,0.000000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,2.500000,0.0
4,6,음식,품목대표,도미구이,구이류,어패류구이,250.0,g,0.0,397.000000,163.300000,61.100000,16.500000,2.100000,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,0.0,5.900000,0.0,0.0,0.0,0.158800,9.700000e-07,0.12037,0.690910,1.108020,1.582170,0.00145,0.00006,0.00006,0.000281,0.0,0.0,0.0,0.0,0.0,0.000066,0.000002,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00376,0.00000,0.0,0.0,0.0,0.000100,0.000270,0.006350,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000038,0.0,0.0,0.000007,0.00084,0.0,0.0,0.0,2.139190,4.277880,4.920980,1.72516,2.222940,2.583860,0.0,2.388480,1.351760,3.926030,0.0,1.958540,0.481770,3.337830,5.706620,8.361830,3.076270,2.060240,2.382060,0.0,0.0,0.0,0.0,0.0,0.0,0.211240,0.0,0.0,3.800000,0.0,0.0,0.0,0.000000,0.000000,0.0,0.400000,0.0,2.500000,0.0,0.800000,0.100000,0.0,0.0,0.0,0.0,0.0,0.000000,0.600000,0.0,2.900000,0.400000,0.200000,0.0,0.0,0.0,1.900000,0.300000,0.000000,0.000000,0.0,0.100000,0.200000,0.0,0.600000,0.0,0.300000,1.600000,0.0,0.0,0.0,0.100000,0.000000,0.000000,0.100000,0.0,0.0,0.0,7.000000,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
49063,46408,가공식품,상용제품,라즈베리 쨈 (054249),잼,잼,100.0,g,320.0,190.000000,0.000000,0.500000,0.000000,47.000000,44.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.000000,0.000000e+00,0.00000,0.000000,0.000000,0.023000,0.00000,0.00000,0.00000,0.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00000,0.00000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.000000,0.00000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.00000,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.0,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.0
49064,46409,가공식품,상용제품,밤 잼,기타잼,기타잼,100.0,g,320.0,230.000000,0.000000,1.120000,0.000000,57.000000,47.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.000000,0.000000e+00,0.00000,0.000000,0.000000,0.015000,0.00000,0.00000,0.00000,0.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00000,0.00000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.000000,0.00000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.00000,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.0,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.0
49065,46410,가공식품,상용제품,블랙베리 쨈,잼,잼,100.0,g,320.0,190.000000,0.000000,0.700000,0.000000,47.000000,46.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.000000,0.000000e+00,0.00000,0.000000,0.000000,0.020000,0.00000,0.00000,0.00000,0.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00000,0.00000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.000000,0.00000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.00000,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.0,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.0
49066,46411,가공식품,상용제품,블루베리 쨈,잼,잼,100.0,g,320.0,185.000000,0.000000,0.000000,0.000000,46.000000,45.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.000000,0.000000e+00,0.00000,0.000000,0.000000,0.015000,0.00000,0.00000,0.00000,0.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00000,0.00000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.000000,0.00000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.00000,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.0,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.000000,0.000000,0.0,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.000000,0.0,0.000000,0.000000,0.0,0.000000,0.0,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.000000,0.0


## 1회 제공량 및 총 내용량 비교후 통합

In [48]:
food_nutrients_copy2 = food_nutrients_copy1.copy()
food_nutrients_copy3 = food_nutrients_copy1.copy()

#### 총 당류, 총 식이섬유 등 영양소의 합계를 나타내는 column들 모두 제거 (전체 영양소 합계 계산할 때 편하게 하기위해)

In [49]:
food_nutrients_copy1 = food_nutrients_copy1.loc[:, ['NO', 'DB군', '상용제품', '식품명', '식품대분류', '식품상세분류', '1회제공량', '단위',
       '총내용량', '에너지', '수분', '단백질',
       '지방', '탄수화물', '자당', '포도당',
       '과당', '유당', '맥아당', '갈락토오스', '당알콜', '에리스리톨',
       '수용성 식이섬유', '불용성 식이섬유',
       '칼슘', '철', '마그네슘', '인', '칼륨',
       '나트륨', '아연', '구리', '망간', '셀레늄', '몰리브덴', '요오드',
       '염소', '비타민 A', '비타민 A(RE)', '레티놀', '베타카로틴', '레티놀A효능',
       '비타민 D(D2+D3)', '비타민 D2', '비타민 D3', '비타민 D1', '비타민 E',
       '비타민 E(α-TE)', '알파 토코페롤', '베타 토코페롤', '감마 토코페롤', '델타 토코페롤',
       '알파 토코트리에놀', '베타 토코트리에놀', '감마 토코트리에놀', '델타 토코트리에놀',
       '토코페롤', '토코트리에놀', '비타민 K', '비타민 K1', '비타민 K2',
       '비타민 B1', '비타민 B2', '나이아신', '나이아신(NE))', '니코틴산', '니코틴아마이드', '판토텐산', '비타민 B6',
       '피리독신', '비오틴', '엽산(DFE)', '엽산 - 천연 엽산', '엽산 - 합성 엽산',
       '비타민 B12', '비타민 C', '콜린', '필수 아미노산', '이소류신',
       '류신', '라이신', '메티오닌', '페닐알라닌', '트레오닌', '트립토판', '발린',
       '히스티딘', '아르기닌', '비필수 아미노산', '티로신', '시스테인', '알라닌',
       '아스파르트산', '글루탐산', '글리신', '프롤린', '세린', '타우린',
       '글리신 베타인 ', '호마린', '트리고넬린', '리보핵산', '데옥시리보핵산',
       '콜레스테롤',
       '부티르산(4:0)', '카프로산(6:0)', '카프릴산(8:0)', '카프르산(10:0)',
       '라우르산(12:0)', '트라이데칸산(13:0)', '미리스트산(14:0)',
       '펜타데칸산(15:0)', '팔미트산(16:0)',
       '헵타데칸산(17:0)', '스테아르산(18:0)', '아라키드산(20:0)',
       '헨에이코산산(21:0)', '베헨산(22:0)', '트리코산산(23:0)',
       '리그노세르산(24:0)',
       '미리스톨레산(14:1)', '팔미톨레산(16:1)',
       '헵타데센산(17:1)', '올레산(18:1(n-9))',
       '박센산(18:1(n-7))', '가돌레산(20:1)',
       '에루크산(22:1)', '네르본산(24:1)',
       '리놀레산(18:2(n-6)c)',
       '알파 리놀렌산(18:3(n-3))',
       '감마 리놀렌산(18:3(n-6))', '에이코사디에노산(20:2(n-6))',
       '에이코사트리에노산(20:3(n-3))', '에이코사트리에노산(20:3(n-6))',
       '아라키돈산(20:4(n-6))',
       '에이코사테트라에노산(20:4(n-3))', '에이코사펜타에노산(20:5(n-3))',
       '도코사디에노산(22:2)', '도코사펜타에노산(22:5(n-3))',
       '도코사헥사에노산(22:6(n-3))',
       'EPA와 DHA의 합', '오메가 3 지방산',
       '오메가 6 지방산', '트랜스 지방산', '트랜스 올레산(18:1(n-9)t)',
       '트랜스 리놀레산 (18:2t)', '트랜스 리놀렌산(18:3t)',
       '냉산가용성물질',
       '카페인']]

In [50]:
# 식품별 총영양소량 구해서 list 생성 -> list_1
list_1 = []
for i in range(len(food_nutrients_copy1.index)):
    summation = 0
    for j in range(9, len(food_nutrients_copy1.columns)):
        summation += food_nutrients_copy1.iloc[i,j]
    list_1.append(summation)

In [51]:
# '1회제공량 < 총영양소량'인 식품 list 생성 -> indexes
# 1회제공량 list 생성 -> list_0
indexes = []
list_0 = food_nutrients_copy1['1회제공량'].tolist()
for i in range(len(list_0)):
    if list_0[i] < list_1[i]:
        indexes.append(i)
    else:
        pass

In [52]:
# list_1에 속한 식품들의 1회제공량을 총내용량으로 대체 -> list_0
for index in indexes:
    list_0[index] = list_1[index]

In [53]:
# 총내용량 column 삭제
food_nutrients_copy2 = food_nutrients_copy2.drop(['총내용량'], axis=1)
food_nutrients_copy2.columns

Index(['NO', 'DB군', '상용제품', '식품명', '식품대분류', '식품상세분류', '1회제공량', '단위', '에너지',
       '수분', '단백질', '지방', '탄수화물', '총당류', '자당', '포도당', '과당', '유당', '맥아당',
       '갈락토오스', '당알콜', '에리스리톨', '총 식이섬유', '총 식이섬유', '수용성 식이섬유', '불용성 식이섬유',
       '칼슘', '철', '마그네슘', '인', '칼륨', '나트륨', '아연', '구리', '망간', '셀레늄', '몰리브덴',
       '요오드', '염소', '비타민 A', '비타민 A(RE)', '레티놀', '베타카로틴', '레티놀A효능',
       '비타민 D(D2+D3)', '비타민 D2', '비타민 D3', '비타민 D1', '비타민 E', '비타민 E(α-TE)',
       '알파 토코페롤', '베타 토코페롤', '감마 토코페롤', '델타 토코페롤', '알파 토코트리에놀', '베타 토코트리에놀',
       '감마 토코트리에놀', '델타 토코트리에놀', '토코페롤', '토코트리에놀', '비타민 K', '비타민 K1', '비타민 K2',
       '비타민 B1', '비타민 B2', '나이아신', '나이아신(NE))', '니코틴산', '니코틴아마이드', '판토텐산',
       '비타민 B6', '피리독신', '비오틴', '엽산(DFE)', '엽산 - 천연 엽산', '엽산 - 합성 엽산',
       '비타민 B12', '비타민 C', '콜린', '총 아미노산', '필수 아미노산', '이소류신', '류신', '라이신',
       '메티오닌', '페닐알라닌', '트레오닌', '트립토판', '발린', '히스티딘', '아르기닌', '비필수 아미노산',
       '티로신', '시스테인', '알라닌', '아스파르트산', '글루탐산', '글리신', '프롤린', '세린', '타우린',
       '글리신 베타인 ', '호마린', '

In [54]:
#1회제공량 column을 list_0으로 대체
food_nutrients_copy2['1회제공량'] = list_0

In [55]:
#food_nutrients_copy5.to_excel('통합 식품영양성분DB_20211116정현우.xlsx')

In [56]:
food_nutrients_copy2.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 49068 entries, 0 to 49806
Columns: 160 entries, NO to 카페인
dtypes: float64(153), int64(1), object(6)
memory usage: 60.3+ MB


#### 영양소별 총 제공량 분류

In [57]:
columns = food_nutrients_copy2.columns
new_columns = []
for name in columns:
    if name[0] == '총':
            new_columns.append(name)
new_columns

['총당류',
 '총 식이섬유',
 '총 식이섬유',
 '총 아미노산',
 '총 지방산',
 '총 필수 지방산',
 '총 포화 지방산',
 '총 단일 불포화지방산',
 '총 다중 불포화지방산',
 '총 불포화지방산']

In [58]:
food_nutrients_copy3 = food_nutrients_copy3.loc[:, ['NO', 'DB군', '상용제품', '식품명', '식품대분류', '식품상세분류', '1회제공량', '단위',
        '수분', '단백질',
       '지방', '탄수화물', '총 식이섬유',
     '총 아미노산',
     '총 지방산',
     '총 필수 지방산',
     '총 포화 지방산',
     '총 단일 불포화지방산',
     '총 다중 불포화지방산',
     '총 불포화지방산',  '식염상당량', '회분']]
food_nutrients_copy3 = food_nutrients_copy3.sort_values(['1회제공량'], ascending=True)
food_nutrients_copy3.head()      

Unnamed: 0,NO,DB군,상용제품,식품명,식품대분류,식품상세분류,1회제공량,단위,수분,단백질,지방,탄수화물,총 식이섬유,총 식이섬유.1,총 아미노산,총 지방산,총 필수 지방산,총 포화 지방산,총 단일 불포화지방산,총 다중 불포화지방산,총 불포화지방산,식염상당량,회분
43685,39260,가공식품,상용제품,에티켓(레몬향),캔디류,캔디류,0.03,g,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
43790,39395,가공식품,상용제품,JW중외모링가플러스,캔디류,캔디류,0.3,g,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
43821,39429,가공식품,상용제품,타트체리 정,캔디류,캔디류,0.5,g,0.0,0.0,0.0,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
43817,39425,가공식품,상용제품,프리바이오틱스정,캔디류,캔디류,0.5,g,0.0,0.0,0.0,0.7,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
43843,39451,가공식품,상용제품,참 착한 보스웰리아정,캔디류,캔디류,0.5,g,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [59]:
#food_nutrients_copy6.to_excel('통합 식품영양성분DB_bygroup.xlsx')

In [60]:
# food_nutrients_copy2 = food_nutrients_copy2.drop(['총내용량'], axis=1)

# food_nutrients_copy2['1회제공량'] = food_nutrients_copy2['1회제공량'].round(6)

# food_nutrients_copy2.loc[:,'에너지': '카페인'] = \ 
# food_nutrients_copy2.loc[:,'에너지': '카페인'].round(6)

# food_nutrients_copy2.to_csv('food_db.csv', mode='w')

In [61]:
df = food_nutrients_copy2.copy()

In [62]:
df.columns

Index(['NO', 'DB군', '상용제품', '식품명', '식품대분류', '식품상세분류', '1회제공량', '단위', '에너지',
       '수분', '단백질', '지방', '탄수화물', '총당류', '자당', '포도당', '과당', '유당', '맥아당',
       '갈락토오스', '당알콜', '에리스리톨', '총 식이섬유', '총 식이섬유', '수용성 식이섬유', '불용성 식이섬유',
       '칼슘', '철', '마그네슘', '인', '칼륨', '나트륨', '아연', '구리', '망간', '셀레늄', '몰리브덴',
       '요오드', '염소', '비타민 A', '비타민 A(RE)', '레티놀', '베타카로틴', '레티놀A효능',
       '비타민 D(D2+D3)', '비타민 D2', '비타민 D3', '비타민 D1', '비타민 E', '비타민 E(α-TE)',
       '알파 토코페롤', '베타 토코페롤', '감마 토코페롤', '델타 토코페롤', '알파 토코트리에놀', '베타 토코트리에놀',
       '감마 토코트리에놀', '델타 토코트리에놀', '토코페롤', '토코트리에놀', '비타민 K', '비타민 K1', '비타민 K2',
       '비타민 B1', '비타민 B2', '나이아신', '나이아신(NE))', '니코틴산', '니코틴아마이드', '판토텐산',
       '비타민 B6', '피리독신', '비오틴', '엽산(DFE)', '엽산 - 천연 엽산', '엽산 - 합성 엽산',
       '비타민 B12', '비타민 C', '콜린', '총 아미노산', '필수 아미노산', '이소류신', '류신', '라이신',
       '메티오닌', '페닐알라닌', '트레오닌', '트립토판', '발린', '히스티딘', '아르기닌', '비필수 아미노산',
       '티로신', '시스테인', '알라닌', '아스파르트산', '글루탐산', '글리신', '프롤린', '세린', '타우린',
       '글리신 베타인 ', '호마린', '

In [63]:
df['에너지'].dtypes

dtype('float64')

In [64]:
df = df.loc[:, ['식품명', '식품대분류', '식품상세분류', '1회제공량', '에너지', '단백질', '지방', '탄수화물', '총당류', '칼슘', '인',\
                        '철', '나트륨', '칼륨', '비타민 A', '비타민 B1', '비타민 B2', '나이아신', '비타민 C', '엽산(DFE)']]

In [65]:
df.loc[:,'1회제공량': '엽산(DFE)'] = df.loc[:,'1회제공량': '엽산(DFE)'].round(6)

In [66]:
# df = df.sort_values(by=['식품명'])

In [67]:
# df.to_csv("sort_food.csv", mode='w')

In [68]:
# df['식품명'].tolist().to_csv('food_name_list',encoding='euc-kr')

In [69]:
# import csv

# with open('food_name_list.csv','w',encoding='utf-8' ) as file :
#     write = csv.writer(file)
#     write.writerow(df['식품명'].tolist())