# Section 4. Working with DataFrames

In [2]:
import pandas as pd
import numpy as np

## 66. Section intro

## 67. What is a DataFrame

In [5]:
# Plain Python lists used as column data for the examples below.
# All three hold six entries, one per person, in the same order.

names = ['Olga','Andrew','Brian','Telulah','Nicole','Tilda']
ages = [29,21,25,23,25,26]
married = [True, False, False, False, True, True]

In [6]:
ser = pd.Series(names, name='names')
ser

0       Olga
1     Andrew
2      Brian
3    Telulah
4     Nicole
5      Tilda
Name: names, dtype: object

In [7]:
df = pd.DataFrame({'name':names,'ages':ages,'married':married})
df

Unnamed: 0,name,ages,married
0,Olga,29,True
1,Andrew,21,False
2,Brian,25,False
3,Telulah,23,False
4,Nicole,25,True
5,Tilda,26,True


In [8]:
ser[2]

'Brian'

In [9]:
df.iloc[2,0]

'Brian'

In [10]:
ser.ndim

1

In [11]:
df.ndim

2

## 68. Creating A DataFrame

In [13]:
names

['Olga', 'Andrew', 'Brian', 'Telulah', 'Nicole', 'Tilda']

In [14]:
ages

[29, 21, 25, 23, 25, 26]

In [15]:
married

[True, False, False, False, True, True]

In [16]:
pd.DataFrame({'name':names,'ages':ages,'married':married})

Unnamed: 0,name,ages,married
0,Olga,29,True
1,Andrew,21,False
2,Brian,25,False
3,Telulah,23,False
4,Nicole,25,True
5,Tilda,26,True


In [17]:
new_names = names + ['Ryan']

In [18]:
len(names)

6

In [19]:
len(new_names)

7

In [20]:
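# Left commented out on purpose: new_names has 7 items while ages and married have 6,
# so this raises ValueError (all arrays must be of the same length).
# pd.DataFrame({'name':new_names,'ages':ages,'married':married})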

## 69. BONUS - Four More Ways To Build DataFrames

In [22]:
#dict of tuples

In [23]:
tuple_names = tuple(names)
tuple_ages = tuple(ages)
tuple_married = tuple(married)

In [24]:
tuple_names

('Olga', 'Andrew', 'Brian', 'Telulah', 'Nicole', 'Tilda')

In [25]:
pd.DataFrame({'name':tuple_names,
              'ages':tuple_ages,
              'married':tuple_married})

Unnamed: 0,name,ages,married
0,Olga,29,True
1,Andrew,21,False
2,Brian,25,False
3,Telulah,23,False
4,Nicole,25,True
5,Tilda,26,True


In [26]:
#dict of series 
series_names = pd.Series(names)
series_ages = pd.Series(ages)
series_married = pd.Series(married)


In [27]:
pd.DataFrame({'name':series_names,
              'ages':series_ages,
              'married':series_married})

Unnamed: 0,name,ages,married
0,Olga,29,True
1,Andrew,21,False
2,Brian,25,False
3,Telulah,23,False
4,Nicole,25,True
5,Tilda,26,True


In [28]:
pd.DataFrame({'names':['Olga','Mike']})

Unnamed: 0,names
0,Olga
1,Mike


In [29]:
pd.DataFrame({'names':{0:'Olga',1:'Mike'}})

Unnamed: 0,names
0,Olga
1,Mike


In [30]:
#enumerate function
list(enumerate(names))

[(0, 'Olga'),
 (1, 'Andrew'),
 (2, 'Brian'),
 (3, 'Telulah'),
 (4, 'Nicole'),
 (5, 'Tilda')]

In [31]:
#dict_names = {k:v for k,v in enumerate(names)}
#dict_names

In [32]:
#dict_ages = {k:v for k,v in enumerate(ages)}
#dict_married = {k:v for k,v in enumerate(married)}

In [33]:
def convert_list_to_dict(l):
    """Map each item's position to the item itself.

    Parameters
    ----------
    l : iterable
        Values to index, e.g. a list of names.

    Returns
    -------
    dict
        ``{0: first, 1: second, ...}`` in iteration order; empty input
        gives an empty dict.
    """
    # dict() consumes the (position, value) pairs from enumerate directly,
    # so no comprehension is needed.
    return dict(enumerate(l))

In [34]:
dict_names = convert_list_to_dict(names)
dict_ages = convert_list_to_dict(ages)
dict_married = convert_list_to_dict(married)

In [35]:
dict_ages

{0: 29, 1: 21, 2: 25, 3: 23, 4: 25, 5: 26}

In [36]:
pd.DataFrame({'name':dict_names,
              'ages':dict_ages,
              'married':dict_married})

Unnamed: 0,name,ages,married
0,Olga,29,True
1,Andrew,21,False
2,Brian,25,False
3,Telulah,23,False
4,Nicole,25,True
5,Tilda,26,True


In [37]:
pd.DataFrame([{'name':'Olga',
              'ages':29,
              'married':False}])

Unnamed: 0,name,ages,married
0,Olga,29,False


In [38]:
list(zip(names,ages,married))

[('Olga', 29, True),
 ('Andrew', 21, False),
 ('Brian', 25, False),
 ('Telulah', 23, False),
 ('Nicole', 25, True),
 ('Tilda', 26, True)]

In [39]:
# One dict per row. The loop variables use singular names so they do not
# shadow the module-level `ages` / `married` lists that are being zipped.
rowwise = [
    {'name': name, 'ages': age, 'married': is_married}
    for name, age, is_married in zip(names, ages, married)
]

In [40]:
pd.DataFrame(rowwise)

Unnamed: 0,name,ages,married
0,Olga,29,True
1,Andrew,21,False
2,Brian,25,False
3,Telulah,23,False
4,Nicole,25,True
5,Tilda,26,True


## 70. The info() method

In [42]:
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 6 entries, 0 to 5
Data columns (total 3 columns):
 #   Column   Non-Null Count  Dtype 
---  ------   --------------  ----- 
 0   name     6 non-null      object
 1   ages     6 non-null      int64 
 2   married  6 non-null      bool  
dtypes: bool(1), int64(1), object(1)
memory usage: 234.0+ bytes


In [43]:
df.info(verbose=False)

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 6 entries, 0 to 5
Columns: 3 entries, name to married
dtypes: bool(1), int64(1), object(1)
memory usage: 234.0+ bytes


In [44]:
df.info(max_cols=2)

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 6 entries, 0 to 5
Columns: 3 entries, name to married
dtypes: bool(1), int64(1), object(1)
memory usage: 234.0+ bytes


In [45]:
df.info(memory_usage='deep')

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 6 entries, 0 to 5
Data columns (total 3 columns):
 #   Column   Non-Null Count  Dtype 
---  ------   --------------  ----- 
 0   name     6 non-null      object
 1   ages     6 non-null      int64 
 2   married  6 non-null      bool  
dtypes: bool(1), int64(1), object(1)
memory usage: 513.0 bytes


## 71. Reading the nutrition data

In [47]:
nutrition = pd.read_csv('nutrition.csv')

In [48]:
nutrition.head(10)

Unnamed: 0.1,Unnamed: 0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
0,0,Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
1,1,"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
2,2,"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
3,3,"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
4,4,"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g
5,5,"Cauliflower, raw",100 g,25,0.3g,0.1g,0,30.00 mg,44.3 mg,57.00 mcg,...,0.28 g,0.130 g,0.034 g,0.031 g,0.00 mg,0.0 g,0.76 g,0.00 mg,0.00 mg,92.07 g
6,6,"Taro leaves, raw",100 g,42,0.7g,0.2g,0,3.00 mg,12.8 mg,126.00 mcg,...,0.74 g,0.151 g,0.060 g,0.307 g,0.00 mg,0.0 g,1.92 g,0.00 mg,0.00 mg,85.66 g
7,7,"Lamb, raw, ground",100 g,282,23g,10g,73mg,59.00 mg,69.3 mg,18.00 mcg,...,23.41 g,10.190 g,9.600 g,1.850 g,73.00 mg,0.0 g,0.87 g,0.00 mg,0.00 mg,59.47 g
8,8,"Cheese, camembert",100 g,300,24g,15g,72mg,842.00 mg,15.4 mg,62.00 mcg,...,24.26 g,15.259 g,7.023 g,0.724 g,72.00 mg,0.0 g,3.68 g,0.00 mg,0.00 mg,51.80 g
9,9,Vegetarian fillets,100 g,290,18g,2.8g,0,490.00 mg,82.0 mg,102.00 mcg,...,18.00 g,2.849 g,4.376 g,9.332 g,0.00 mg,0.0 g,5.00 g,0.00 mg,0.00 mg,45.00 g


In [49]:
nutrition.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 8789 entries, 0 to 8788
Data columns (total 77 columns):
 #   Column                       Non-Null Count  Dtype 
---  ------                       --------------  ----- 
 0   Unnamed: 0                   8789 non-null   int64 
 1   name                         8789 non-null   object
 2   serving_size                 8789 non-null   object
 3   calories                     8789 non-null   int64 
 4   total_fat                    8789 non-null   object
 5   saturated_fat                7199 non-null   object
 6   cholesterol                  8789 non-null   object
 7   sodium                       8789 non-null   object
 8   choline                      8789 non-null   object
 9   folate                       8789 non-null   object
 10  folic_acid                   8789 non-null   object
 11  niacin                       8789 non-null   object
 12  pantothenic_acid             8789 non-null   object
 13  riboflavin                   8789

In [50]:
nutrition.info(verbose=False, memory_usage='deep')

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 8789 entries, 0 to 8788
Columns: 77 entries, Unnamed: 0 to water
dtypes: int64(3), object(74)
memory usage: 34.3 MB


## 72. Some cleanup. Removing the duplicate index

In [52]:
nutrition.head()

Unnamed: 0.1,Unnamed: 0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
0,0,Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
1,1,"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
2,2,"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
3,3,"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
4,4,"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g


In [53]:
nutrition['Unnamed: 0']

0          0
1          1
2          2
3          3
4          4
        ... 
8784    8784
8785    8785
8786    8786
8787    8787
8788    8788
Name: Unnamed: 0, Length: 8789, dtype: int64

In [54]:
nutrition.drop('Unnamed: 0', axis=1)

Unnamed: 0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
0,Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
1,"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
2,"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
3,"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
4,"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
8784,"Beef, raw, all grades, trimmed to 0"" fat, sepa...",100 g,125,3.5g,1.4g,62mg,54.00 mg,64.5 mg,4.00 mcg,0.00 mcg,...,3.50 g,1.353 g,1.554 g,0.244 g,62.00 mg,0.0 g,1.11 g,0.00 mg,0.00 mg,72.51 g
8785,"Lamb, cooked, separable lean only, composite o...",100 g,206,8.9g,3.9g,109mg,50.00 mg,0,0.00 mcg,0.00 mcg,...,8.86 g,3.860 g,3.480 g,0.520 g,109.00 mg,0,1.60 g,0,0,59.95 g
8786,"Lamb, raw, separable lean and fat, composite o...",100 g,277,23g,12g,78mg,39.00 mg,0,1.00 mcg,0.00 mcg,...,22.74 g,11.570 g,8.720 g,0.980 g,78.00 mg,0,0.92 g,0,0,59.80 g
8787,"Beef, raw, all grades, trimmed to 0"" fat, sepa...",100 g,121,3g,1.1g,60mg,53.00 mg,64.2 mg,4.00 mcg,0.00 mcg,...,3.04 g,1.086 g,1.266 g,0.233 g,60.00 mg,0.0 g,1.10 g,0.00 mg,0.00 mg,73.43 g


In [55]:
nutrition.set_index('Unnamed: 0')

Unnamed: 0_level_0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
Unnamed: 0,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
0,Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
1,"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
2,"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
3,"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
4,"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
8784,"Beef, raw, all grades, trimmed to 0"" fat, sepa...",100 g,125,3.5g,1.4g,62mg,54.00 mg,64.5 mg,4.00 mcg,0.00 mcg,...,3.50 g,1.353 g,1.554 g,0.244 g,62.00 mg,0.0 g,1.11 g,0.00 mg,0.00 mg,72.51 g
8785,"Lamb, cooked, separable lean only, composite o...",100 g,206,8.9g,3.9g,109mg,50.00 mg,0,0.00 mcg,0.00 mcg,...,8.86 g,3.860 g,3.480 g,0.520 g,109.00 mg,0,1.60 g,0,0,59.95 g
8786,"Lamb, raw, separable lean and fat, composite o...",100 g,277,23g,12g,78mg,39.00 mg,0,1.00 mcg,0.00 mcg,...,22.74 g,11.570 g,8.720 g,0.980 g,78.00 mg,0,0.92 g,0,0,59.80 g
8787,"Beef, raw, all grades, trimmed to 0"" fat, sepa...",100 g,121,3g,1.1g,60mg,53.00 mg,64.2 mg,4.00 mcg,0.00 mcg,...,3.04 g,1.086 g,1.266 g,0.233 g,60.00 mg,0.0 g,1.10 g,0.00 mg,0.00 mg,73.43 g


In [56]:
nutrition = pd.read_csv('nutrition.csv', index_col='Unnamed: 0') #index_col=[0] same result
nutrition.head()

Unnamed: 0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
0,Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
1,"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
2,"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
3,"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
4,"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g


## 73. The sample method

In [58]:
nutrition.sample()

Unnamed: 0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
327,"Turnip greens, raw",100 g,32,0.3g,0.1g,0,40.00 mg,0,194.00 mcg,0.00 mcg,...,0.30 g,0.070 g,0.020 g,0.120 g,0.00 mg,0.0 g,1.40 g,0.00 mg,0.00 mg,89.67 g


In [59]:
nutrition.sample(random_state=12) #same result for everyone

Unnamed: 0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
3713,"Thuringer, pork, beef, summer sausage, cervelat",100 g,362,30g,12g,74mg,1300.00 mg,78.9 mg,2.00 mcg,0.00 mcg,...,30.43 g,11.510 g,12.970 g,1.200 g,74.00 mg,0.0 g,3.63 g,0.00 mg,0.00 mg,45.18 g


In [60]:
nutrition.sample(frac=0.01)

Unnamed: 0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
7043,"Frozen novelties, and grape POPSICLE pops, che...",100 g,21,0g,,0,10.00 mg,0,0,0,...,0.00 g,0.000 g,0,0,0.00 mg,0,0.06 g,0,0,94.03 g
623,"Borage, raw",100 g,21,0.7g,0.2g,0,80.00 mg,0,13.00 mcg,0.00 mcg,...,0.70 g,0.170 g,0.211 g,0.109 g,0.00 mg,0,1.44 g,0,0,93.00 g
5520,"Pork, roasted, cooked, separable lean and fat,...",100 g,361,31g,9.2g,105mg,91.00 mg,71.0 mg,0.00 mcg,0,...,30.86 g,9.242 g,10.709 g,2.996 g,105.00 mg,0.0 g,0.82 g,0.00 mg,0.00 mg,48.11 g
3513,"MORNINGSTAR FARMS Veggie Dog, unprepared, frozen",100 g,126,1.3g,0.2g,0,1076.00 mg,0,2.00 mcg,0,...,1.30 g,0.200 g,0.200 g,0.600 g,0.00 mg,0,6.10 g,0,0,64.00 g
4238,"Snack, plain, made from dried potatoes, potato...",100 g,545,35g,8.6g,0,400.00 mg,32.8 mg,19.00 mcg,0.00 mcg,...,35.28 g,8.643 g,6.140 g,15.502 g,0.00 mg,0.0 g,2.34 g,0.00 mg,0.00 mg,2.37 g
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
6365,"Snacks, and E, C, with vitamins A, FARLEY Frui...",100 g,341,0g,,0,36.00 mg,0,0,0,...,0.00 g,0,0,0,0,0,0.00 g,0,0,14.70 g
4832,"Squash, without salt, baked, cooked, all varie...",100 g,37,0.4g,0.1g,0,1.00 mg,10.6 mg,20.00 mcg,0.00 mcg,...,0.35 g,0.072 g,0.026 g,0.147 g,0.00 mg,0.0 g,0.69 g,0.00 mg,0.00 mg,89.21 g
5722,"Beans, solids and liquids, seasoned, all style...",100 g,16,0.2g,,0,373.00 mg,0,18.00 mcg,0.00 mcg,...,0.20 g,0.045 g,0.008 g,0.102 g,0.00 mg,0,1.18 g,0,0,94.30 g
2177,"Butter replacement, powder, without fat",100 g,373,1g,0.6g,2mg,1200.00 mg,0.4 mg,0.00 mcg,0.00 mcg,...,1.00 g,0.589 g,0.276 g,0.057 g,2.00 mg,0.0 g,3.00 g,0.00 mg,0.00 mg,5.00 g


In [61]:
nutrition.shape[0]

8789

In [62]:
nutrition.shape[0] * 0.01

87.89

## 74. BONUS - Sampling With Replacement Or Weights

In [64]:
# Weighted sampling: the Series index holds row labels of `nutrition`,
# the values are relative sampling weights (pandas normalises them to sum to 1).
# Per the pandas docs, rows whose label is missing from `weights` get weight 0.
weights = pd.Series([10,10,10,1,2],index=[7,17,29,5,6])
weights


7     10
17    10
29    10
5      1
6      2
dtype: int64

In [65]:
nutrition.sample(n=3, weights=weights)

Unnamed: 0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
7,"Lamb, raw, ground",100 g,282,23g,10g,73mg,59.00 mg,69.3 mg,18.00 mcg,0.00 mcg,...,23.41 g,10.190 g,9.600 g,1.850 g,73.00 mg,0.0 g,0.87 g,0.00 mg,0.00 mg,59.47 g
17,"Peppers, raw, jalapeno",100 g,29,0.4g,0.1g,0,3.00 mg,7.5 mg,27.00 mcg,0.00 mcg,...,0.37 g,0.092 g,0.029 g,0.112 g,0.00 mg,0.0 g,0.53 g,0.00 mg,0.00 mg,91.69 g
6,"Taro leaves, raw",100 g,42,0.7g,0.2g,0,3.00 mg,12.8 mg,126.00 mcg,0.00 mcg,...,0.74 g,0.151 g,0.060 g,0.307 g,0.00 mg,0.0 g,1.92 g,0.00 mg,0.00 mg,85.66 g


## 75. BONUS - How Are Random Numbers Generated?

In [67]:
nutrition.sample(random_state=13)

Unnamed: 0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
4453,"KFC, Skin and Breading, EXTRA CRISPY, Fried Ch...",100 g,464,37g,7.5g,59mg,828.00 mg,0,0,0,...,36.61 g,7.541 g,11.816 g,14.238 g,59.00 mg,0,2.92 g,0,0,26.98 g


## 76. DataFrame Axes

In [69]:
nutrition.head()

Unnamed: 0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
0,Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
1,"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
2,"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
3,"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
4,"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g


In [70]:
nutrition.axes

[Index([   0,    1,    2,    3,    4,    5,    6,    7,    8,    9,
        ...
        8779, 8780, 8781, 8782, 8783, 8784, 8785, 8786, 8787, 8788],
       dtype='int64', length=8789),
 Index(['name', 'serving_size', 'calories', 'total_fat', 'saturated_fat',
        'cholesterol', 'sodium', 'choline', 'folate', 'folic_acid', 'niacin',
        'pantothenic_acid', 'riboflavin', 'thiamin', 'vitamin_a',
        'vitamin_a_rae', 'carotene_alpha', 'carotene_beta',
        'cryptoxanthin_beta', 'lutein_zeaxanthin', 'lucopene', 'vitamin_b12',
        'vitamin_b6', 'vitamin_c', 'vitamin_d', 'vitamin_e', 'tocopherol_alpha',
        'vitamin_k', 'calcium', 'copper', 'irom', 'magnesium', 'manganese',
        'phosphorous', 'potassium', 'selenium', 'zink', 'protein', 'alanine',
        'arginine', 'aspartic_acid', 'cystine', 'glutamic_acid', 'glycine',
        'histidine', 'hydroxyproline', 'isoleucine', 'leucine', 'lysine',
        'methionine', 'phenylalanine', 'proline', 'serine', 'threonine',
 

In [71]:
nutrition.axes[0]

Index([   0,    1,    2,    3,    4,    5,    6,    7,    8,    9,
       ...
       8779, 8780, 8781, 8782, 8783, 8784, 8785, 8786, 8787, 8788],
      dtype='int64', length=8789)

In [72]:
nutrition.axes[0][3]

3

In [73]:
nutrition.index[3]

3

In [74]:
nutrition.axes[1][69]

'polyunsaturated_fatty_acids'

In [75]:
nutrition.columns[69]

'polyunsaturated_fatty_acids'

In [76]:
# nutrition.dropna(axis=0)

In [77]:
# axis 0 = rows (the index)
# axis 1 = columns

In [78]:
nutrition.axes[0]

Index([   0,    1,    2,    3,    4,    5,    6,    7,    8,    9,
       ...
       8779, 8780, 8781, 8782, 8783, 8784, 8785, 8786, 8787, 8788],
      dtype='int64', length=8789)

In [79]:
nutrition.axes[1]

Index(['name', 'serving_size', 'calories', 'total_fat', 'saturated_fat',
       'cholesterol', 'sodium', 'choline', 'folate', 'folic_acid', 'niacin',
       'pantothenic_acid', 'riboflavin', 'thiamin', 'vitamin_a',
       'vitamin_a_rae', 'carotene_alpha', 'carotene_beta',
       'cryptoxanthin_beta', 'lutein_zeaxanthin', 'lucopene', 'vitamin_b12',
       'vitamin_b6', 'vitamin_c', 'vitamin_d', 'vitamin_e', 'tocopherol_alpha',
       'vitamin_k', 'calcium', 'copper', 'irom', 'magnesium', 'manganese',
       'phosphorous', 'potassium', 'selenium', 'zink', 'protein', 'alanine',
       'arginine', 'aspartic_acid', 'cystine', 'glutamic_acid', 'glycine',
       'histidine', 'hydroxyproline', 'isoleucine', 'leucine', 'lysine',
       'methionine', 'phenylalanine', 'proline', 'serine', 'threonine',
       'tryptophan', 'tyrosine', 'valine', 'carbohydrate', 'fiber', 'sugars',
       'fructose', 'galactose', 'glucose', 'lactose', 'maltose', 'sucrose',
       'fat', 'saturated_fatty_acids', 'mon

## 77. Changing The Index

In [81]:
nutrition.index

Index([   0,    1,    2,    3,    4,    5,    6,    7,    8,    9,
       ...
       8779, 8780, 8781, 8782, 8783, 8784, 8785, 8786, 8787, 8788],
      dtype='int64', length=8789)

In [82]:
type(nutrition.index)

pandas.core.indexes.base.Index

In [83]:
# Swap the generic integer Index for a RangeIndex with the same labels.
# The stop value comes from the frame itself instead of a hard-coded row count,
# so the cell keeps working if the CSV gains or loses rows.
nutrition.index = pd.RangeIndex(start=0, stop=len(nutrition), step=1)

In [84]:
type(nutrition.index)

pandas.core.indexes.range.RangeIndex

In [85]:
# nutrition.set_index('name',inplace=True)

In [86]:
# nutrition.set_index('folic_acid', drop=True) #True is default

In [87]:
nutrition.set_index('folic_acid', drop=False) # drop=True is the default; drop=False keeps folic_acid as a regular column too

Unnamed: 0_level_0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
folic_acid,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
0.00 mcg,Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
0.00 mcg,"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
0.00 mcg,"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
0,"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
0.00 mcg,"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
0.00 mcg,"Beef, raw, all grades, trimmed to 0"" fat, sepa...",100 g,125,3.5g,1.4g,62mg,54.00 mg,64.5 mg,4.00 mcg,0.00 mcg,...,3.50 g,1.353 g,1.554 g,0.244 g,62.00 mg,0.0 g,1.11 g,0.00 mg,0.00 mg,72.51 g
0.00 mcg,"Lamb, cooked, separable lean only, composite o...",100 g,206,8.9g,3.9g,109mg,50.00 mg,0,0.00 mcg,0.00 mcg,...,8.86 g,3.860 g,3.480 g,0.520 g,109.00 mg,0,1.60 g,0,0,59.95 g
0.00 mcg,"Lamb, raw, separable lean and fat, composite o...",100 g,277,23g,12g,78mg,39.00 mg,0,1.00 mcg,0.00 mcg,...,22.74 g,11.570 g,8.720 g,0.980 g,78.00 mg,0,0.92 g,0,0,59.80 g
0.00 mcg,"Beef, raw, all grades, trimmed to 0"" fat, sepa...",100 g,121,3g,1.1g,60mg,53.00 mg,64.2 mg,4.00 mcg,0.00 mcg,...,3.04 g,1.086 g,1.266 g,0.233 g,60.00 mg,0.0 g,1.10 g,0.00 mg,0.00 mg,73.43 g


In [88]:
# append=True keeps the existing index as the outer level and adds folic_acid as an inner level.
nutrition.set_index('folic_acid', drop=False, append=True, verify_integrity=True).head() # defaults: drop=True, append=False, verify_integrity=False

Unnamed: 0_level_0,Unnamed: 1_level_0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
Unnamed: 0_level_1,folic_acid,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1
0,0.00 mcg,Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
1,0.00 mcg,"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
2,0.00 mcg,"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
3,0,"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
4,0.00 mcg,"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g


In [89]:
nutrition.calories.value_counts()

calories
884    78
47     45
56     43
0      39
50     38
       ..
549     1
643     1
556     1
584     1
605     1
Name: count, Length: 671, dtype: int64

In [90]:
#nutrition.set_index('calories', verify_integrity=True)
# Raises ValueError: 'calories' contains duplicate values (see the value_counts output above),
# so it cannot pass the integrity check.

## 78. Extracting From DataFrames By Label

In [92]:
nutrition.head()

Unnamed: 0,name,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
0,Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
1,"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
2,"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
3,"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
4,"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g


In [93]:
nutrition.set_index('name',inplace=True)

In [94]:
nutrition.head()

Unnamed: 0_level_0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,0.000 mg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,1.167 mg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,0.649 mg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,3.363 mg,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,0.063 mg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g


In [95]:
nutrition.loc['Eggplant, raw']

serving_size       100 g
calories              25
total_fat           0.2g
saturated_fat        NaN
cholesterol            0
                  ...   
alcohol            0.0 g
ash               0.66 g
caffeine         0.00 mg
theobromine      0.00 mg
water            92.30 g
Name: Eggplant, raw, Length: 75, dtype: object

In [96]:
# Two-step lookup: .loc returns the whole row as a Series, then ['calories'] picks one entry from it.
nutrition.loc['Eggplant, raw']['calories']

25

In [97]:
nutrition.loc['Eggplant, raw','calories']

25

In [98]:
nutrition.loc['Eggplant, raw':'Sherbet, orange','calories':'cholesterol']

Unnamed: 0_level_0,calories,total_fat,saturated_fat,cholesterol
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
"Eggplant, raw",25,0.2g,,0
"Teff, uncooked",367,2.4g,0.4g,0
"Sherbet, orange",144,2g,1.2g,1mg


In [99]:
nutrition.loc[
['Raspberries, raw','Blackberries, raw'],
['protein','vitamin_b6']
]

Unnamed: 0_level_0,protein,vitamin_b6
name,Unnamed: 1_level_1,Unnamed: 2_level_1
"Raspberries, raw",1.20 g,0.055 mg
"Blackberries, raw",1.39 g,0.030 mg


## 79. DataFrame Extraction by Position

In [101]:
nutrition.head()

Unnamed: 0_level_0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,0.000 mg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,1.167 mg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,0.649 mg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,3.363 mg,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,0.063 mg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g


In [102]:
nutrition.iloc[3]

serving_size      100 g
calories            367
total_fat          2.4g
saturated_fat      0.4g
cholesterol           0
                  ...  
alcohol               0
ash              2.37 g
caffeine              0
theobromine           0
water            8.82 g
Name: Teff, uncooked, Length: 75, dtype: object

In [103]:
nutrition.iloc[3,:]

serving_size      100 g
calories            367
total_fat          2.4g
saturated_fat      0.4g
cholesterol           0
                  ...  
alcohol               0
ash              2.37 g
caffeine              0
theobromine           0
water            8.82 g
Name: Teff, uncooked, Length: 75, dtype: object

In [104]:
nutrition.iloc[[4,6,9],:]

Unnamed: 0_level_0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,0.063 mg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g
"Taro leaves, raw",100 g,42,0.7g,0.2g,0,3.00 mg,12.8 mg,126.00 mcg,0.00 mcg,1.513 mg,...,0.74 g,0.151 g,0.060 g,0.307 g,0.00 mg,0.0 g,1.92 g,0.00 mg,0.00 mg,85.66 g
Vegetarian fillets,100 g,290,18g,2.8g,0,490.00 mg,82.0 mg,102.00 mcg,0.00 mcg,12.000 mg,...,18.00 g,2.849 g,4.376 g,9.332 g,0.00 mg,0.0 g,5.00 g,0.00 mg,0.00 mg,45.00 g


In [105]:
nutrition.iloc[[4,6,9]]

Unnamed: 0_level_0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,0.063 mg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g
"Taro leaves, raw",100 g,42,0.7g,0.2g,0,3.00 mg,12.8 mg,126.00 mcg,0.00 mcg,1.513 mg,...,0.74 g,0.151 g,0.060 g,0.307 g,0.00 mg,0.0 g,1.92 g,0.00 mg,0.00 mg,85.66 g
Vegetarian fillets,100 g,290,18g,2.8g,0,490.00 mg,82.0 mg,102.00 mcg,0.00 mcg,12.000 mg,...,18.00 g,2.849 g,4.376 g,9.332 g,0.00 mg,0.0 g,5.00 g,0.00 mg,0.00 mg,45.00 g


In [106]:
# nutrition.iloc[[4,6,9],'total_fat']  # fails: iloc accepts integer positions only, not column labels

In [107]:
nutrition.iloc[[4,6,9],2]

name
Sherbet, orange         2g
Taro leaves, raw      0.7g
Vegetarian fillets     18g
Name: total_fat, dtype: object

In [108]:
nutrition.iloc[[4,6,9],2:5]

Unnamed: 0_level_0,total_fat,saturated_fat,cholesterol
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
"Sherbet, orange",2g,1.2g,1mg
"Taro leaves, raw",0.7g,0.2g,0
Vegetarian fillets,18g,2.8g,0


In [109]:
# Keep every other row and every other column (positions 0, 2, 4, ...) using boolean masks.
# The mask lengths are read from nutrition.shape instead of being hard-coded, so the cell
# keeps working if the dataset gains or loses rows/columns.
new_nutr = nutrition.iloc[
[i % 2 == 0 for i in range(nutrition.shape[0])],
[i % 2 == 0 for i in range(nutrition.shape[1])]
]

In [110]:
nutrition.shape #x rows and y columns

(8789, 75)

In [111]:
new_nutr.shape  # ceil(x/2) rows and ceil(y/2) columns: both counts are odd, so the even positions are the larger half

(4395, 38)

In [112]:
nutrition.iloc[9,1]

290

## 80. Single Value Access With .at And .iat

In [114]:
nutrition.loc['Nuts, pecans','calories']

691

In [115]:
nutrition.iloc[1,1]

691

In [116]:
nutrition.at['Nuts, pecans','calories']

691

In [117]:
nutrition.iat[1,1]

691

In [118]:
%timeit nutrition.loc['Nuts, pecans','calories']

10.2 μs ± 1.49 μs per loop (mean ± std. dev. of 7 runs, 100,000 loops each)


In [119]:
%timeit nutrition.at['Nuts, pecans','calories']

3.14 μs ± 258 ns per loop (mean ± std. dev. of 7 runs, 100,000 loops each)


## 81. BONUS - The get_loc() Method

In [121]:
index_label = nutrition.index[2]

In [122]:
column_label = 'vitamin_k'

In [123]:
nutrition.loc[index_label, column_label]

'3.5 mcg'

In [124]:
nutrition.at[index_label, column_label]

'3.5 mcg'

In [125]:
nutrition.columns

Index(['serving_size', 'calories', 'total_fat', 'saturated_fat', 'cholesterol',
       'sodium', 'choline', 'folate', 'folic_acid', 'niacin',
       'pantothenic_acid', 'riboflavin', 'thiamin', 'vitamin_a',
       'vitamin_a_rae', 'carotene_alpha', 'carotene_beta',
       'cryptoxanthin_beta', 'lutein_zeaxanthin', 'lucopene', 'vitamin_b12',
       'vitamin_b6', 'vitamin_c', 'vitamin_d', 'vitamin_e', 'tocopherol_alpha',
       'vitamin_k', 'calcium', 'copper', 'irom', 'magnesium', 'manganese',
       'phosphorous', 'potassium', 'selenium', 'zink', 'protein', 'alanine',
       'arginine', 'aspartic_acid', 'cystine', 'glutamic_acid', 'glycine',
       'histidine', 'hydroxyproline', 'isoleucine', 'leucine', 'lysine',
       'methionine', 'phenylalanine', 'proline', 'serine', 'threonine',
       'tryptophan', 'tyrosine', 'valine', 'carbohydrate', 'fiber', 'sugars',
       'fructose', 'galactose', 'glucose', 'lactose', 'maltose', 'sucrose',
       'fat', 'saturated_fatty_acids', 'monounsatur

In [126]:
nutrition.columns.get_loc('vitamin_k')

26

In [127]:
# Look the column position up instead of hard-coding the number printed by the previous cell,
# so it stays correct if columns are added, removed or reordered.
column_loc = nutrition.columns.get_loc(column_label)
# index_label was taken from nutrition.index[2], so its position is 2 by construction.
index_loc = 2

In [128]:
nutrition.iloc[index_loc, column_loc]

'3.5 mcg'

In [129]:
nutrition.iat[index_loc, column_loc]

'3.5 mcg'

## 82. Skill Challenge

## 83. Solution

In [132]:
# Fix the seed so the same 10 rows are drawn on every run; the results of the cells below
# depend on which rows end up in the sample.
nutr_mini = nutrition.sample(10, random_state=42)
nutr_mini

Unnamed: 0_level_0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Cereals ready-to-eat, RAISIN BRAN CRUNCH, KELLOGG'S, KELLOGG",100 g,354,1.8g,0.4g,0,358.00 mg,18.7 mg,189.00 mcg,170.00 mcg,9.390 mg,...,1.79 g,0.400 g,0.300 g,0.690 g,0.00 mg,0.0 g,1.70 g,0.00 mg,0.00 mg,5.00 g
"Cereals ready-to-eat, QUAKER Honey Graham LIFE Cereal, QUAKER",100 g,373,4.1g,0.8g,0,488.00 mg,0,1311.00 mcg,0,18.416 mg,...,4.14 g,0.770 g,1.401 g,1.335 g,0.00 mg,0,3.67 g,0,0,4.30 g
"Soup, dry, beef flavor, ramen noodle",100 g,441,18g,8.2g,0,1727.00 mg,5.3 mg,111.00 mcg,0,5.139 mg,...,17.73 g,8.158 g,6.189 g,2.191 g,0,0,5.31 g,0,0,6.56 g
"Beef, raw, kidneys, variety meats and by-products",100 g,99,3.1g,0.9g,411mg,182.00 mg,0,98.00 mcg,0.00 mcg,8.030 mg,...,3.09 g,0.868 g,0.586 g,0.545 g,411.00 mg,0.0 g,1.33 g,0.00 mg,0.00 mg,77.89 g
"Candies, TWIZZLERS NIBS CHERRY BITS",100 g,347,2.6g,0.5g,0,195.00 mg,0,0,0,0,...,2.64 g,0.540 g,1.880 g,0.140 g,0.00 mg,0,0.57 g,0,0,15.00 g
"Puddings, prepared with whole milk, dry mix, tapioca",100 g,115,2.9g,1.7g,12mg,120.00 mg,0,4.00 mcg,0.00 mcg,0.073 mg,...,2.89 g,1.724 g,0.786 g,0.107 g,12.00 mg,0.0 g,0.85 g,0.00 mg,0.00 mg,73.97 g
"Beverages, non-carbonated, bottled, water, DASANI, The COCA-COLA company",100 g,0,0g,,0,0,0,0,0,0,...,0.00 g,0,0,0,0,0,0.00 g,0,0,99.96 g
"Grapes, raw, muscadine",100 g,57,0.5g,,0,1.00 mg,0,2.00 mcg,0,0,...,0.47 g,0,0,0,0,0,0.50 g,0,0,84.29 g
"Babyfood, arrowroot, cookies",100 g,424,10g,1g,0,319.00 mg,0,35.00 mcg,25.00 mcg,5.739 mg,...,10.00 g,1.048 g,7.922 g,0.591 g,0.00 mg,0,1.40 g,0,0,5.60 g
"Danish pastry, enriched, cinnamon",100 g,403,22g,5.7g,21mg,414.00 mg,21.8 mg,68.00 mcg,35.00 mcg,2.867 mg,...,22.40 g,5.681 g,12.515 g,2.933 g,21.00 mg,0.0 g,1.70 g,0.00 mg,0.00 mg,24.30 g


In [133]:
nutr_mini.shape

(10, 75)

In [134]:
nutr_mini.loc[:,['total_fat','cholesterol']]

Unnamed: 0_level_0,total_fat,cholesterol
name,Unnamed: 1_level_1,Unnamed: 2_level_1
"Cereals ready-to-eat, RAISIN BRAN CRUNCH, KELLOGG'S, KELLOGG",1.8g,0
"Cereals ready-to-eat, QUAKER Honey Graham LIFE Cereal, QUAKER",4.1g,0
"Soup, dry, beef flavor, ramen noodle",18g,0
"Beef, raw, kidneys, variety meats and by-products",3.1g,411mg
"Candies, TWIZZLERS NIBS CHERRY BITS",2.6g,0
"Puddings, prepared with whole milk, dry mix, tapioca",2.9g,12mg
"Beverages, non-carbonated, bottled, water, DASANI, The COCA-COLA company",0g,0
"Grapes, raw, muscadine",0.5g,0
"Babyfood, arrowroot, cookies",10g,0
"Danish pastry, enriched, cinnamon",22g,21mg


In [135]:
nutr_mini_b12_loc = nutr_mini.columns.get_loc('vitamin_b12')

In [136]:
nutr_mini.iloc[0:3,nutr_mini_b12_loc:]

Unnamed: 0_level_0,vitamin_b12,vitamin_b6,vitamin_c,vitamin_d,vitamin_e,tocopherol_alpha,vitamin_k,calcium,copper,irom,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Cereals ready-to-eat, RAISIN BRAN CRUNCH, KELLOGG'S, KELLOGG",2.79 mcg,0.930 mg,2.0 mg,75.00 IU,0.44 mg,0.44 mg,1.5 mcg,35.00 mg,0.361 mg,8.50 mg,...,1.79 g,0.400 g,0.300 g,0.690 g,0.00 mg,0.0 g,1.70 g,0.00 mg,0.00 mg,5.00 g
"Cereals ready-to-eat, QUAKER Honey Graham LIFE Cereal, QUAKER",0.00 mcg,1.842 mg,0.0 mg,0,0.57 mg,0.57 mg,0,366.00 mg,0,29.73 mg,...,4.14 g,0.770 g,1.401 g,1.335 g,0.00 mg,0,3.67 g,0,0,4.30 g
"Soup, dry, beef flavor, ramen noodle",0,0.037 mg,0.6 mg,0,2.49 mg,2.49 mg,9.0 mcg,21.00 mg,0.122 mg,3.93 mg,...,17.73 g,8.158 g,6.189 g,2.191 g,0,0,5.31 g,0,0,6.56 g


In [137]:
nutr_mini.iat[2,1]

441

In [138]:
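# Disabled: this label is not among the rows of the nutr_mini shown above (presumably it came from
# an earlier random sample), so .at would raise KeyError.
#nutr_mini.at['Beef, broiled, cooked, all grades, trimmed to 0" fat, separable lean and fat, small end (ribs 10-12), rib eye','calories']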

In [139]:
nutr_mini

Unnamed: 0_level_0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Cereals ready-to-eat, RAISIN BRAN CRUNCH, KELLOGG'S, KELLOGG",100 g,354,1.8g,0.4g,0,358.00 mg,18.7 mg,189.00 mcg,170.00 mcg,9.390 mg,...,1.79 g,0.400 g,0.300 g,0.690 g,0.00 mg,0.0 g,1.70 g,0.00 mg,0.00 mg,5.00 g
"Cereals ready-to-eat, QUAKER Honey Graham LIFE Cereal, QUAKER",100 g,373,4.1g,0.8g,0,488.00 mg,0,1311.00 mcg,0,18.416 mg,...,4.14 g,0.770 g,1.401 g,1.335 g,0.00 mg,0,3.67 g,0,0,4.30 g
"Soup, dry, beef flavor, ramen noodle",100 g,441,18g,8.2g,0,1727.00 mg,5.3 mg,111.00 mcg,0,5.139 mg,...,17.73 g,8.158 g,6.189 g,2.191 g,0,0,5.31 g,0,0,6.56 g
"Beef, raw, kidneys, variety meats and by-products",100 g,99,3.1g,0.9g,411mg,182.00 mg,0,98.00 mcg,0.00 mcg,8.030 mg,...,3.09 g,0.868 g,0.586 g,0.545 g,411.00 mg,0.0 g,1.33 g,0.00 mg,0.00 mg,77.89 g
"Candies, TWIZZLERS NIBS CHERRY BITS",100 g,347,2.6g,0.5g,0,195.00 mg,0,0,0,0,...,2.64 g,0.540 g,1.880 g,0.140 g,0.00 mg,0,0.57 g,0,0,15.00 g
"Puddings, prepared with whole milk, dry mix, tapioca",100 g,115,2.9g,1.7g,12mg,120.00 mg,0,4.00 mcg,0.00 mcg,0.073 mg,...,2.89 g,1.724 g,0.786 g,0.107 g,12.00 mg,0.0 g,0.85 g,0.00 mg,0.00 mg,73.97 g
"Beverages, non-carbonated, bottled, water, DASANI, The COCA-COLA company",100 g,0,0g,,0,0,0,0,0,0,...,0.00 g,0,0,0,0,0,0.00 g,0,0,99.96 g
"Grapes, raw, muscadine",100 g,57,0.5g,,0,1.00 mg,0,2.00 mcg,0,0,...,0.47 g,0,0,0,0,0,0.50 g,0,0,84.29 g
"Babyfood, arrowroot, cookies",100 g,424,10g,1g,0,319.00 mg,0,35.00 mcg,25.00 mcg,5.739 mg,...,10.00 g,1.048 g,7.922 g,0.591 g,0.00 mg,0,1.40 g,0,0,5.60 g
"Danish pastry, enriched, cinnamon",100 g,403,22g,5.7g,21mg,414.00 mg,21.8 mg,68.00 mcg,35.00 mcg,2.867 mg,...,22.40 g,5.681 g,12.515 g,2.933 g,21.00 mg,0.0 g,1.70 g,0.00 mg,0.00 mg,24.30 g


## 84. More Cleanup: Going Numeric

In [141]:
nutrition.head()

Unnamed: 0_level_0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,0.000 mg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,1.167 mg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,0.649 mg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,3.363 mg,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,0.063 mg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g


In [142]:
nutrition.total_fat.head()

name
Cornstarch         0.1g
Nuts, pecans        72g
Eggplant, raw      0.2g
Teff, uncooked     2.4g
Sherbet, orange      2g
Name: total_fat, dtype: object

## 85. The astype() Method

In [144]:
# Toy frame for the astype() demo: age and weight hold integers, height holds numeric text.
df = pd.DataFrame(dict(
    age=[21, 25, 35, 25],
    weight=[70, 85, 82, 25],
    height=['1.72', '1.81', '1.79', '1.65'],
))

In [145]:
df

Unnamed: 0,age,weight,height
0,21,70,1.72
1,25,85,1.81
2,35,82,1.79
3,25,25,1.65


In [146]:
df.astype(float)

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
1,25.0,85.0,1.81
2,35.0,82.0,1.79
3,25.0,25.0,1.65


In [147]:
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 4 entries, 0 to 3
Data columns (total 3 columns):
 #   Column  Non-Null Count  Dtype 
---  ------  --------------  ----- 
 0   age     4 non-null      int64 
 1   weight  4 non-null      int64 
 2   height  4 non-null      object
dtypes: int64(2), object(1)
memory usage: 228.0+ bytes


In [148]:
#reassign
df = df.astype(float)
df

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
1,25.0,85.0,1.81
2,35.0,82.0,1.79
3,25.0,25.0,1.65


In [149]:
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 4 entries, 0 to 3
Data columns (total 3 columns):
 #   Column  Non-Null Count  Dtype  
---  ------  --------------  -----  
 0   age     4 non-null      float64
 1   weight  4 non-null      float64
 2   height  4 non-null      float64
dtypes: float64(3)
memory usage: 228.0 bytes


In [150]:
df.astype({'age':int})

Unnamed: 0,age,weight,height
0,21,70.0,1.72
1,25,85.0,1.81
2,35,82.0,1.79
3,25,25.0,1.65


In [151]:
df.astype({'age':np.int16})

Unnamed: 0,age,weight,height
0,21,70.0,1.72
1,25,85.0,1.81
2,35,82.0,1.79
3,25,25.0,1.65


In [152]:
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 4 entries, 0 to 3
Data columns (total 3 columns):
 #   Column  Non-Null Count  Dtype  
---  ------  --------------  -----  
 0   age     4 non-null      float64
 1   weight  4 non-null      float64
 2   height  4 non-null      float64
dtypes: float64(3)
memory usage: 228.0 bytes


In [153]:
nutrition.iloc[:4,:]

Unnamed: 0_level_0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,0.000 mg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,1.167 mg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,0.649 mg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,3.363 mg,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g


In [154]:
# nutrition.iloc[:4,:].astype(float)  # won't work: values such as '100 g' or '0.1g' carry unit text and cannot be parsed as floats

In [155]:
float(714)

714.0

In [156]:
float('714')

714.0

In [157]:
# float('714g')  # raises ValueError: the trailing unit makes the string non-numeric

## 86. DataFrame replace() + A Glimpse At Regex

In [159]:
dfm = nutrition.iloc[:6,:1]
dfm

Unnamed: 0_level_0,serving_size
name,Unnamed: 1_level_1
Cornstarch,100 g
"Nuts, pecans",100 g
"Eggplant, raw",100 g
"Teff, uncooked",100 g
"Sherbet, orange",100 g
"Cauliflower, raw",100 g


In [160]:
dfm.info()

<class 'pandas.core.frame.DataFrame'>
Index: 6 entries, Cornstarch to Cauliflower, raw
Data columns (total 1 columns):
 #   Column        Non-Null Count  Dtype 
---  ------        --------------  ----- 
 0   serving_size  6 non-null      object
dtypes: object(1)
memory usage: 96.0+ bytes


In [161]:
dfm.replace(to_replace='100 g', value=100)

  dfm.replace(to_replace='100 g', value=100)


Unnamed: 0_level_0,serving_size
name,Unnamed: 1_level_1
Cornstarch,100
"Nuts, pecans",100
"Eggplant, raw",100
"Teff, uncooked",100
"Sherbet, orange",100
"Cauliflower, raw",100


In [162]:
#dfm.replace('100 g',100)

In [163]:
# Without regex=True, replace() only matches whole cell values, so the 'g' inside '100 g' is left untouched.
dfm.replace('g', '')

Unnamed: 0_level_0,serving_size
name,Unnamed: 1_level_1
Cornstarch,100 g
"Nuts, pecans",100 g
"Eggplant, raw",100 g
"Teff, uncooked",100 g
"Sherbet, orange",100 g
"Cauliflower, raw",100 g


In [164]:
#regex -- regular expressions

In [165]:
# A raw string avoids the invalid '\ ' escape sequence, which triggers a SyntaxWarning on recent Python versions.
# With regex=True the pattern matches inside each value, stripping the ' g' suffix before the int cast.
dfm.replace(r' g', '', regex=True).astype(int)

  dfm.replace('\ g', '', regex=True).astype(int)


Unnamed: 0_level_0,serving_size
name,Unnamed: 1_level_1
Cornstarch,100
"Nuts, pecans",100
"Eggplant, raw",100
"Teff, uncooked",100
"Sherbet, orange",100
"Cauliflower, raw",100


In [166]:
nutrition.head()

Unnamed: 0_level_0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,0.000 mg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,1.167 mg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,0.649 mg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,3.363 mg,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,0.063 mg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g


## 87. Part I: Collecting The Units

In [168]:
# Strip every non-letter character from every value, leaving only the unit text ('g', 'mg', 'mcg', ...).
# astype(str) turns missing values into the string 'nan', which is why 'nan' appears as a "unit" in the counts below.
units = nutrition.astype(str).replace('[^a-zA-Z]', '', regex=True)

In [169]:
units.head()

Unnamed: 0_level_0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Cornstarch,g,,g,,,mg,mg,mcg,mcg,mg,...,g,g,g,g,mg,g,g,mg,mg,g
"Nuts, pecans",g,,g,g,,mg,mg,mcg,mcg,mg,...,g,g,g,g,mg,g,g,mg,mg,g
"Eggplant, raw",g,,g,,,mg,mg,mcg,mcg,mg,...,g,g,g,g,mg,g,g,mg,mg,g
"Teff, uncooked",g,,g,g,,mg,mg,,,mg,...,g,g,g,g,,,g,,,g
"Sherbet, orange",g,,g,g,mg,mg,mg,mcg,mcg,mg,...,g,g,g,g,mg,g,g,mg,mg,g


In [170]:
units.saturated_fat.value_counts()

saturated_fat
g      7199
nan    1590
Name: count, dtype: int64

In [171]:
units.saturated_fat.mode()

0    g
Name: saturated_fat, dtype: object

In [172]:
units.mode()

Unnamed: 0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
0,g,,g,g,mg,mg,mg,mcg,mcg,mg,...,g,g,g,g,mg,g,g,mg,mg,g


In [173]:
units = units.mode()

## 88. The rename() Method

In [175]:
nutrition.head()

Unnamed: 0_level_0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,0.000 mg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,1.167 mg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,0.649 mg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,3.363 mg,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,0.063 mg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g


In [176]:
df

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
1,25.0,85.0,1.81
2,35.0,82.0,1.79
3,25.0,25.0,1.65


In [177]:
df.rename(index={0:'Pikachu'})

Unnamed: 0,age,weight,height
Pikachu,21.0,70.0,1.72
1,25.0,85.0,1.81
2,35.0,82.0,1.79
3,25.0,25.0,1.65


In [178]:
df.rename(index={0:'Pikachu',1:'Nacho'})

Unnamed: 0,age,weight,height
Pikachu,21.0,70.0,1.72
Nacho,25.0,85.0,1.81
2,35.0,82.0,1.79
3,25.0,25.0,1.65


In [179]:
df.rename(columns={'weight':'Weight (kg)'})

Unnamed: 0,age,Weight (kg),height
0,21.0,70.0,1.72
1,25.0,85.0,1.81
2,35.0,82.0,1.79
3,25.0,25.0,1.65


In [180]:
df.rename(index={0:'One'}, columns={'age':'years'}, inplace=False)

Unnamed: 0,years,weight,height
One,21.0,70.0,1.72
1,25.0,85.0,1.81
2,35.0,82.0,1.79
3,25.0,25.0,1.65


In [181]:
df

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
1,25.0,85.0,1.81
2,35.0,82.0,1.79
3,25.0,25.0,1.65


In [182]:
df.rename(mapper={'age':'years'}, axis=1)

Unnamed: 0,years,weight,height
0,21.0,70.0,1.72
1,25.0,85.0,1.81
2,35.0,82.0,1.79
3,25.0,25.0,1.65


In [183]:
df.axes[1]

Index(['age', 'weight', 'height'], dtype='object')

In [184]:
df.axes[0]

RangeIndex(start=0, stop=4, step=1)

## 89. DataFrame dropna()

In [186]:
df

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
1,25.0,85.0,1.81
2,35.0,82.0,1.79
3,25.0,25.0,1.65


In [187]:
df.loc[2,'weight'] = np.nan

In [188]:
df

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
1,25.0,85.0,1.81
2,35.0,,1.79
3,25.0,25.0,1.65


In [189]:
df.loc[1,:] = np.nan

In [190]:
df

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
1,,,
2,35.0,,1.79
3,25.0,25.0,1.65


In [191]:
df.dropna()

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
3,25.0,25.0,1.65


In [192]:
df.dropna(how='any', axis=0)

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
3,25.0,25.0,1.65


In [193]:
df.dropna(how='all', axis=0)

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
2,35.0,,1.79
3,25.0,25.0,1.65


In [194]:
df.dropna(thresh=3, axis=0)

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
3,25.0,25.0,1.65


In [195]:
# thresh: the minimum number of non-NaN values a row (or column) needs in order to be kept

In [196]:
# Setting the threshold to the number of columns keeps only fully populated rows.
df.dropna(axis='index', thresh=len(df.columns))

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
3,25.0,25.0,1.65


In [197]:
df

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
1,,,
2,35.0,,1.79
3,25.0,25.0,1.65


In [198]:
# Column-wise: drop every column that has at least one NaN.
df.dropna(axis='columns')

0
1
2
3


In [199]:
# Same as the column-wise default, with how='any' spelled out.
df.dropna(axis='columns', how='any')

0
1
2
3


In [200]:
# Drop a column only when every one of its values is NaN.
df.dropna(axis='columns', how='all')

Unnamed: 0,age,weight,height
0,21.0,70.0,1.72
1,,,
2,35.0,,1.79
3,25.0,25.0,1.65


In [201]:
# Keep only the columns holding at least 3 non-NaN values.
# The result is bound back to `df` instead of using inplace=True: the in-place
# form returns None, cannot be chained, and silently changes a frame that
# earlier cells have already displayed.
df = df.dropna(axis=1, thresh=3)

In [202]:
df

Unnamed: 0,age,height
0,21.0,1.72
1,,
2,35.0,1.79
3,25.0,1.65


## 90. BONUS - dropna() With Subset

In [204]:
# Add a text column with one missing entry (third row) to experiment with `subset`.
df['gender'] = [
    'M',
    'F',
    np.nan,
    'F',
]

In [205]:
df

Unnamed: 0,age,height,gender
0,21.0,1.72,M
1,,,F
2,35.0,1.79,
3,25.0,1.65,F


In [206]:
# Default behaviour: every column is inspected and any row containing a NaN is removed.
df.dropna()

Unnamed: 0,age,height,gender
0,21.0,1.72,M
3,25.0,1.65,F


In [207]:
# The same call with the default arguments written explicitly.
df.dropna(axis='index', how='any')

Unnamed: 0,age,height,gender
0,21.0,1.72,M
3,25.0,1.65,F


In [208]:
# the subset parameter

In [209]:
# Only the 'gender' column is checked for NaN; missing values in other
# columns no longer cause a row to be dropped.
df.dropna(subset=['gender'], how='any', axis='index')

Unnamed: 0,age,height,gender
0,21.0,1.72,M
1,,,F
3,25.0,1.65,F


In [210]:
# Column-wise with no subset: any column containing a NaN in any row is removed.
df.dropna(axis='columns', how='any')

0
1
2
3


In [211]:
# When dropping columns, `subset` lists ROW labels: a column is removed only
# if it has a NaN in row 0 or row 2; NaNs in other rows are ignored.
df.dropna(axis='columns', how='any', subset=[0, 2])

Unnamed: 0,age,height
0,21.0,1.72
1,,
2,35.0,1.79
3,25.0,1.65


## 91. Part II: Merging Units With Column Names

In [213]:
units

Unnamed: 0,serving_size,calories,total_fat,saturated_fat,cholesterol,sodium,choline,folate,folic_acid,niacin,...,fat,saturated_fatty_acids,monounsaturated_fatty_acids,polyunsaturated_fatty_acids,fatty_acids_total_trans,alcohol,ash,caffeine,theobromine,water
0,g,,g,g,mg,mg,mg,mcg,mcg,mg,...,g,g,g,g,mg,g,g,mg,mg,g


In [214]:
# the rename method

In [215]:
# Iterating over a DataFrame walks through its column labels.
for k in units.columns:
    print(k)

serving_size
calories
total_fat
saturated_fat
cholesterol
sodium
choline
folate
folic_acid
niacin
pantothenic_acid
riboflavin
thiamin
vitamin_a
vitamin_a_rae
carotene_alpha
carotene_beta
cryptoxanthin_beta
lutein_zeaxanthin
lucopene
vitamin_b12
vitamin_b6
vitamin_c
vitamin_d
vitamin_e
tocopherol_alpha
vitamin_k
calcium
copper
irom
magnesium
manganese
phosphorous
potassium
selenium
zink
protein
alanine
arginine
aspartic_acid
cystine
glutamic_acid
glycine
histidine
hydroxyproline
isoleucine
leucine
lysine
methionine
phenylalanine
proline
serine
threonine
tryptophan
tyrosine
valine
carbohydrate
fiber
sugars
fructose
galactose
glucose
lactose
maltose
sucrose
fat
saturated_fatty_acids
monounsaturated_fatty_acids
polyunsaturated_fatty_acids
fatty_acids_total_trans
alcohol
ash
caffeine
theobromine
water


In [216]:
# units has a single row (label 0); print the unit stored there for each column.
for k in units:
    print(units.at[0, k])

g

g
g
mg
mg
mg
mcg
mcg
mg
mg
mg
mg
IU
mcg
mcg
mcg
mcg
mcg

mcg
mg
mg
IU
mg
mg
mcg
mg
mg
mg
mg
mg
mg
mg
mcg
mg
g
g
g
g
g
g
g
g

g
g
g
g
g
g
g
g
g
g
g
g
g
g






g
g
g
g
mg
g
g
mg
mg
g


In [217]:
# Look at one column of `units` as a Series. The last column is selected
# explicitly rather than through a loop variable left over from another cell,
# so this cell gives the same result regardless of what ran before it.
units[units.columns[-1]]

0    g
Name: water, dtype: object

In [218]:
# Columns with no unit hold an empty string. Turn those into NaN and drop the
# affected columns, leaving only the columns that actually have a unit.
# mask() is used instead of replace('', np.nan) because the latter emits a
# FutureWarning about silent downcasting on recent pandas versions.
units = units.mask(units == '').dropna(axis=1)

  units = units.replace('', np.nan).dropna(axis=1)


In [219]:
# Re-check the units after the cleanup: every remaining column should print a unit.
for k in units.columns:
    print(units.loc[0, k])

g
g
g
mg
mg
mg
mcg
mcg
mg
mg
mg
mg
IU
mcg
mcg
mcg
mcg
mcg
mcg
mg
mg
IU
mg
mg
mcg
mg
mg
mg
mg
mg
mg
mg
mcg
mg
g
g
g
g
g
g
g
g
g
g
g
g
g
g
g
g
g
g
g
g
g
g
g
g
g
g
mg
g
g
mg
mg
g


In [220]:
# Build the old-name -> new-name mapping by appending each column's unit
# (taken from the row labelled 0) to its name, e.g. 'sodium' -> 'sodium_mg'.
mapper = {
    column: column + "_" + unit
    for column, unit in units.loc[0].items()
}

In [221]:
mapper

{'serving_size': 'serving_size_g',
 'total_fat': 'total_fat_g',
 'saturated_fat': 'saturated_fat_g',
 'cholesterol': 'cholesterol_mg',
 'sodium': 'sodium_mg',
 'choline': 'choline_mg',
 'folate': 'folate_mcg',
 'folic_acid': 'folic_acid_mcg',
 'niacin': 'niacin_mg',
 'pantothenic_acid': 'pantothenic_acid_mg',
 'riboflavin': 'riboflavin_mg',
 'thiamin': 'thiamin_mg',
 'vitamin_a': 'vitamin_a_IU',
 'vitamin_a_rae': 'vitamin_a_rae_mcg',
 'carotene_alpha': 'carotene_alpha_mcg',
 'carotene_beta': 'carotene_beta_mcg',
 'cryptoxanthin_beta': 'cryptoxanthin_beta_mcg',
 'lutein_zeaxanthin': 'lutein_zeaxanthin_mcg',
 'vitamin_b12': 'vitamin_b12_mcg',
 'vitamin_b6': 'vitamin_b6_mg',
 'vitamin_c': 'vitamin_c_mg',
 'vitamin_d': 'vitamin_d_IU',
 'vitamin_e': 'vitamin_e_mg',
 'tocopherol_alpha': 'tocopherol_alpha_mg',
 'vitamin_k': 'vitamin_k_mcg',
 'calcium': 'calcium_mg',
 'copper': 'copper_mg',
 'irom': 'irom_mg',
 'magnesium': 'magnesium_mg',
 'manganese': 'manganese_mg',
 'phosphorous': 'phospho

In [222]:
# Apply the unit-suffixed names. Columns absent from `mapper` keep their
# current name. The result is bound back to `nutrition` instead of using
# inplace=True, which returns None and mutates a frame shown by earlier cells.
nutrition = nutrition.rename(columns=mapper)

In [223]:
nutrition

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,0.000 mg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,1.167 mg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,0.649 mg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,3.363 mg,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,0.063 mg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
"Beef, raw, all grades, trimmed to 0"" fat, separable lean and fat, boneless, top round roast, round",100 g,125,3.5g,1.4g,62mg,54.00 mg,64.5 mg,4.00 mcg,0.00 mcg,6.422 mg,...,3.50 g,1.353 g,1.554 g,0.244 g,62.00 mg,0.0 g,1.11 g,0.00 mg,0.00 mg,72.51 g
"Lamb, cooked, separable lean only, composite of trimmed retail cuts, frozen, imported, New Zealand",100 g,206,8.9g,3.9g,109mg,50.00 mg,0,0.00 mcg,0.00 mcg,7.680 mg,...,8.86 g,3.860 g,3.480 g,0.520 g,109.00 mg,0,1.60 g,0,0,59.95 g
"Lamb, raw, separable lean and fat, composite of trimmed retail cuts, frozen, imported, New Zealand",100 g,277,23g,12g,78mg,39.00 mg,0,1.00 mcg,0.00 mcg,6.550 mg,...,22.74 g,11.570 g,8.720 g,0.980 g,78.00 mg,0,0.92 g,0,0,59.80 g
"Beef, raw, all grades, trimmed to 0"" fat, separable lean only, boneless, eye of round roast, round",100 g,121,3g,1.1g,60mg,53.00 mg,64.2 mg,4.00 mcg,0.00 mcg,6.720 mg,...,3.04 g,1.086 g,1.266 g,0.233 g,60.00 mg,0.0 g,1.10 g,0.00 mg,0.00 mg,73.43 g


## 92. Part III: Removing Units From Values

In [225]:
# Preview the first five rows; values still carry their unit text at this point.
nutrition.head()

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Cornstarch,100 g,381,0.1g,,0,9.00 mg,0.4 mg,0.00 mcg,0.00 mcg,0.000 mg,...,0.05 g,0.009 g,0.016 g,0.025 g,0.00 mg,0.0 g,0.09 g,0.00 mg,0.00 mg,8.32 g
"Nuts, pecans",100 g,691,72g,6.2g,0,0.00 mg,40.5 mg,22.00 mcg,0.00 mcg,1.167 mg,...,71.97 g,6.180 g,40.801 g,21.614 g,0.00 mg,0.0 g,1.49 g,0.00 mg,0.00 mg,3.52 g
"Eggplant, raw",100 g,25,0.2g,,0,2.00 mg,6.9 mg,22.00 mcg,0.00 mcg,0.649 mg,...,0.18 g,0.034 g,0.016 g,0.076 g,0.00 mg,0.0 g,0.66 g,0.00 mg,0.00 mg,92.30 g
"Teff, uncooked",100 g,367,2.4g,0.4g,0,12.00 mg,13.1 mg,0,0,3.363 mg,...,2.38 g,0.449 g,0.589 g,1.071 g,0,0,2.37 g,0,0,8.82 g
"Sherbet, orange",100 g,144,2g,1.2g,1mg,46.00 mg,7.7 mg,4.00 mcg,0.00 mcg,0.063 mg,...,2.00 g,1.160 g,0.530 g,0.080 g,1.00 mg,0.0 g,0.40 g,0.00 mg,0.00 mg,66.10 g


In [226]:
# Remove every ASCII letter from the string cells so that only the numeric
# part of values such as '9.00 mg' remains. regex=True makes the pattern
# match inside a cell instead of requiring the whole cell to equal it.
# The result is bound back to `nutrition` instead of using inplace=True.
nutrition = nutrition.replace(r'[a-zA-Z]', '', regex=True)

In [227]:
# Preview the same five rows to confirm the unit text is gone.
nutrition.head(n=5)

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Cornstarch,100,381,0.1,,0,9.0,0.4,0.0,0.0,0.0,...,0.05,0.009,0.016,0.025,0.0,0.0,0.09,0.0,0.0,8.32
"Nuts, pecans",100,691,72.0,6.2,0,0.0,40.5,22.0,0.0,1.167,...,71.97,6.18,40.801,21.614,0.0,0.0,1.49,0.0,0.0,3.52
"Eggplant, raw",100,25,0.2,,0,2.0,6.9,22.0,0.0,0.649,...,0.18,0.034,0.016,0.076,0.0,0.0,0.66,0.0,0.0,92.3
"Teff, uncooked",100,367,2.4,0.4,0,12.0,13.1,0.0,0.0,3.363,...,2.38,0.449,0.589,1.071,0.0,0.0,2.37,0.0,0.0,8.82
"Sherbet, orange",100,144,2.0,1.2,1,46.0,7.7,4.0,0.0,0.063,...,2.0,1.16,0.53,0.08,1.0,0.0,0.4,0.0,0.0,66.1


In [228]:
nutrition.dtypes

serving_size_g     object
calories            int64
total_fat_g        object
saturated_fat_g    object
cholesterol_mg     object
                    ...  
alcohol_g          object
ash_g              object
caffeine_mg        object
theobromine_mg     object
water_g            object
Length: 75, dtype: object

In [229]:
nutrition.dtypes.value_counts()

object    73
int64      2
Name: count, dtype: int64

In [230]:
# With the unit text stripped, convert every column to 64-bit floats.
nutrition = nutrition.astype('float64')

In [231]:
nutrition.dtypes

serving_size_g     float64
calories           float64
total_fat_g        float64
saturated_fat_g    float64
cholesterol_mg     float64
                    ...   
alcohol_g          float64
ash_g              float64
caffeine_mg        float64
theobromine_mg     float64
water_g            float64
Length: 75, dtype: object

In [232]:
nutrition.info(verbose=False)

<class 'pandas.core.frame.DataFrame'>
Index: 8789 entries, Cornstarch to Beef, raw, all grades, trimmed to 0" fat, separable lean only, boneless, eye of round steak, round
Columns: 75 entries, serving_size_g to water_g
dtypes: float64(75)
memory usage: 5.3+ MB


## 93. Filtering in 2D

In [234]:
nutrition.shape

(8789, 75)

In [235]:
# Keep the rows whose index label contains 'octopus'.
# `like` is a plain, case-sensitive substring match.
nutrition.filter(axis='index', like='octopus')

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Mollusks, raw, common, octopus",100.0,82.0,1.0,0.2,48.0,230.0,65.0,16.0,0.0,2.1,...,1.04,0.227,0.162,0.239,48.0,0.0,1.6,0.0,0.0,80.25
"Mollusks, moist heat, cooked, common, octopus",100.0,164.0,2.1,0.5,96.0,460.0,81.0,24.0,0.0,3.78,...,2.08,0.453,0.324,0.477,96.0,0.0,3.2,0.0,0.0,60.5


In [236]:
# A regex with the inline (?i) flag makes the label match case-insensitive,
# so labels starting with a capital 'Octopus' are found as well.
nutrition.filter(axis='index', regex='(?i)octopus')

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Octopus (Alaska Native),100.0,56.0,0.8,0.2,41.0,0.0,0.0,0.0,0.0,2.0,...,0.8,0.2,0.0,0.2,41.0,0.0,1.5,0.0,0.0,84.0
"Mollusks, raw, common, octopus",100.0,82.0,1.0,0.2,48.0,230.0,65.0,16.0,0.0,2.1,...,1.04,0.227,0.162,0.239,48.0,0.0,1.6,0.0,0.0,80.25
"Mollusks, moist heat, cooked, common, octopus",100.0,164.0,2.1,0.5,96.0,460.0,81.0,24.0,0.0,3.78,...,2.08,0.453,0.324,0.477,96.0,0.0,3.2,0.0,0.0,60.5


In [237]:
# Filter in two dimensions: first narrow the rows by label, then keep three
# named columns, in the order they are listed.
(
    nutrition
    .filter(regex='(?i)octopus', axis='index')
    .filter(items=['cholesterol_mg', 'serving_size_g', 'calories'], axis='columns')
)

Unnamed: 0_level_0,cholesterol_mg,serving_size_g,calories
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
Octopus (Alaska Native),41.0,100.0,56.0
"Mollusks, raw, common, octopus",48.0,100.0,82.0
"Mollusks, moist heat, cooked, common, octopus",96.0,100.0,164.0


## 94. DataFrame Sorting

In [239]:
# Sort a single column (a Series) in ascending order, the default.
nutrition['vitamin_b12_mcg'].sort_values()

name
Cornstarch                                                                           0.00
Apricots, stewed, sulfured, dehydrated (low-moisture)                                0.00
Cocoa, processed with alkali, unsweetened, dry powder                                0.00
Tomato products, with herbs and cheese, sauce, canned                                0.00
Mothbeans, without salt, boiled, cooked, mature seeds                                0.00
                                                                                    ...  
Veal, braised, cooked, liver, variety meats and by-products                         84.60
Lamb, pan-fried, cooked, liver, variety meats and by-products                       85.70
Lamb, raw, liver, variety meats and by-products                                     90.05
Beef, boiled, cooked, variety meats and by-products liver, imported, New Zealand    96.00
Mollusks, moist heat, cooked, mixed species, clam                                   98.89
Name:

In [240]:
# Sort the whole frame by one column, highest calories first.
nutrition.sort_values(by='calories', ascending=False)

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Fat, mutton tallow",100.0,902.0,100.0,47.0,102.0,0.0,79.8,0.0,0.0,0.00,...,100.0,47.300,40.600,7.800,102.0,0.0,0.00,0.0,0.0,0.00
"Fish oil, salmon",100.0,902.0,100.0,20.0,485.0,0.0,0.0,0.0,0.0,0.00,...,100.0,19.872,29.037,40.324,485.0,0.0,0.00,0.0,0.0,0.00
Lard,100.0,902.0,100.0,39.0,95.0,0.0,49.7,0.0,0.0,0.00,...,100.0,39.200,45.100,11.200,95.0,0.0,0.00,0.0,0.0,0.00
"Fat, beef tallow",100.0,902.0,100.0,50.0,109.0,0.0,79.8,0.0,0.0,0.00,...,100.0,49.800,41.800,4.000,109.0,0.0,0.00,0.0,0.0,0.00
"Fish oil, cod liver",100.0,902.0,100.0,23.0,570.0,0.0,0.0,0.0,0.0,0.00,...,100.0,22.608,46.711,22.541,570.0,0.0,0.00,0.0,0.0,0.00
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
"Beverages, decaffeinated, brewed, green, tea",100.0,0.0,0.0,,0.0,0.0,0.0,0.0,0.0,0.03,...,0.0,0.000,0.000,0.000,0.0,0.0,0.00,0.0,0.0,99.93
"Beverages, caffeine free, cola, ZEVIA",100.0,0.0,0.0,,0.0,6.0,0.0,0.0,0.0,0.00,...,0.0,0.000,0.000,0.000,0.0,0.0,0.01,0.0,0.0,98.87
"Carbonated beverage, without caffeine, with sodium saccharin, other than cola or pepper, low calorie",100.0,0.0,0.0,,0.0,16.0,0.0,0.0,0.0,0.00,...,0.0,0.000,0.000,0.000,0.0,0.0,0.10,0.0,0.0,99.80
"Beverages, unsweetened, ready to drink, green, tea",100.0,0.0,0.0,,0.0,7.0,0.0,0.0,0.0,0.00,...,0.0,0.000,0.000,0.000,0.0,0.0,0.12,12.0,0.0,99.88


In [241]:
# Sort by cholesterol, breaking ties with sodium; both keys descending.
(
    nutrition
    .sort_values(by=['cholesterol_mg', 'sodium_mg'], ascending=False)
    .head(3)
)

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Veal, braised, cooked, brain, variety meats and by-products",100.0,136.0,9.6,2.2,3100.0,156.0,0.0,3.0,0.0,2.43,...,9.63,2.18,1.74,1.49,3100.0,0.0,1.4,0.0,0.0,76.89
"Beef, simmered, cooked, brain, variety meats and by-products",100.0,151.0,11.0,2.4,3100.0,108.0,490.9,5.0,0.0,3.62,...,10.53,2.394,1.882,1.632,3100.0,0.0,1.46,0.0,0.0,74.86
"Beef, raw, brain, variety meats and by-products",100.0,143.0,10.0,2.3,3010.0,126.0,0.0,3.0,0.0,3.55,...,10.3,2.3,1.89,1.586,3010.0,0.0,1.51,0.0,0.0,76.29


In [242]:
# One sort direction per key: cholesterol descending, then sodium ascending
# among rows that tie on cholesterol.
(
    nutrition
    .sort_values(by=['cholesterol_mg', 'sodium_mg'], ascending=[False, True])
    .head(3)
)

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Beef, simmered, cooked, brain, variety meats and by-products",100.0,151.0,11.0,2.4,3100.0,108.0,490.9,5.0,0.0,3.62,...,10.53,2.394,1.882,1.632,3100.0,0.0,1.46,0.0,0.0,74.86
"Veal, braised, cooked, brain, variety meats and by-products",100.0,136.0,9.6,2.2,3100.0,156.0,0.0,3.0,0.0,2.43,...,9.63,2.18,1.74,1.49,3100.0,0.0,1.4,0.0,0.0,76.89
"Beef, raw, brain, variety meats and by-products",100.0,143.0,10.0,2.3,3010.0,126.0,0.0,3.0,0.0,3.55,...,10.3,2.3,1.89,1.586,3010.0,0.0,1.51,0.0,0.0,76.29


In [243]:
# For one food, list the nutrients measured in grams from largest to smallest.
# The regex anchors the match to the END of the column name ('_g$'); a plain
# like='_g' would also pick up any column that merely contains '_g' somewhere
# in the middle of its name.
(
    nutrition
    .loc['Beef, simmered, cooked, brain, variety meats and by-products']
    .filter(regex='_g$')
    .sort_values(ascending=False)
)

serving_size_g                   100.000
water_g                           74.860
protein_g                         11.670
total_fat_g                       11.000
fat_g                             10.530
saturated_fat_g                    2.400
saturated_fatty_acids_g            2.394
monounsaturated_fatty_acids_g      1.882
polyunsaturated_fatty_acids_g      1.632
carbohydrate_g                     1.480
ash_g                              1.460
threonine_g                        0.000
alcohol_g                          0.000
sugars_g                           0.000
fiber_g                            0.000
valine_g                           0.000
tyrosine_g                         0.000
tryptophan_g                       0.000
serine_g                           0.000
phenylalanine_g                    0.000
methionine_g                       0.000
lysine_g                           0.000
leucine_g                          0.000
isoleucine_g                       0.000
histidine_g     

## 95. Using Series between() With DataFrames

In [245]:
# Peek at the first ten calorie values.
nutrition['calories'].head(10)

name
Cornstarch            381.0
Nuts, pecans          691.0
Eggplant, raw          25.0
Teff, uncooked        367.0
Sherbet, orange       144.0
Cauliflower, raw       25.0
Taro leaves, raw       42.0
Lamb, raw, ground     282.0
Cheese, camembert     300.0
Vegetarian fillets    290.0
Name: calories, dtype: float64

In [246]:
# between() yields a boolean Series (both bounds included by default), which
# is then used as a row mask on the frame.
nutrition.loc[nutrition['calories'].between(20, 60)]

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Eggplant, raw",100.0,25.0,0.2,,0.0,2.0,6.9,22.0,0.0,0.649,...,0.18,0.034,0.016,0.076,0.0,0.0,0.66,0.0,0.0,92.30
"Cauliflower, raw",100.0,25.0,0.3,0.1,0.0,30.0,44.3,57.0,0.0,0.507,...,0.28,0.130,0.034,0.031,0.0,0.0,0.76,0.0,0.0,92.07
"Taro leaves, raw",100.0,42.0,0.7,0.2,0.0,3.0,12.8,126.0,0.0,1.513,...,0.74,0.151,0.060,0.307,0.0,0.0,1.92,0.0,0.0,85.66
"PACE, Picante Sauce",100.0,25.0,0.0,,0.0,781.0,0.0,0.0,0.0,0.000,...,0.00,0.000,0.000,0.000,0.0,0.0,3.85,0.0,0.0,89.90
"Mango nectar, canned",100.0,51.0,0.1,,0.0,5.0,1.5,7.0,0.0,0.080,...,0.06,0.014,0.022,0.011,0.0,0.0,0.08,0.0,0.0,86.63
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
"Beverages, added calcium, high vitamin C, greater than 3% fruit juice, reduced sugar, Fruit flavored drink",100.0,29.0,0.4,,0.0,25.0,0.1,2.0,0.0,0.000,...,0.37,0.000,0.000,0.000,0.0,0.0,0.06,0.0,0.0,93.00
"Ruby Red grapefruit juice blend (grapefruit, grape, apple), with added vitamin C, bottled, OCEAN SPRAY",100.0,44.0,0.1,,0.0,8.0,0.0,0.0,0.0,0.000,...,0.10,0.008,0.008,0.014,0.0,0.0,0.27,0.0,0.0,88.60
"Beverages, prepared with water, frozen concentrate, with juice and pulp, breakfast type, Orange drink",100.0,45.0,0.0,,0.0,10.0,0.0,0.0,0.0,0.253,...,0.00,0.001,0.001,0.001,0.0,0.0,0.48,0.0,0.0,88.08
"Apple juice, diluted with 3 volume water without added ascorbic acid, unsweetened, frozen concentrate",100.0,47.0,0.1,,0.0,7.0,1.8,0.0,0.0,0.038,...,0.10,0.018,0.002,0.031,0.0,0.0,0.32,0.0,0.0,87.90


In [247]:
# Draw 4 random rows from the 20-60 calorie band. A fixed random_state makes
# the draw repeatable, so re-running the notebook shows the same rows.
nutrition[nutrition.calories.between(20, 60)].sample(n=4, random_state=42)

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Mushrooms, without salt, cooked, shiitake",100.0,56.0,0.2,0.1,0.0,4.0,36.8,21.0,0.0,1.5,...,0.22,0.05,0.07,0.034,0.0,0.0,0.35,0.0,0.0,83.48
"Babyfood, strained, vegetables and turkey, dinner",100.0,48.0,0.9,0.2,4.0,20.0,6.7,10.0,0.0,0.466,...,0.9,0.236,0.294,0.241,4.0,0.0,0.35,0.0,0.0,88.82
"Gravy, turkey, CAMPBELL'S",100.0,42.0,1.7,0.8,0.0,458.0,0.0,0.0,0.0,0.0,...,1.69,0.847,0.0,0.0,0.0,0.0,1.73,0.0,0.0,89.8
"Mushrooms, without salt, drained, boiled, cooked, white",100.0,28.0,0.5,0.1,0.0,2.0,20.4,18.0,0.0,4.46,...,0.47,0.061,0.008,0.183,0.0,0.0,0.99,0.0,0.0,91.08


## 97. DataFrame nlargest() and nsmallest()

In [249]:
# The manual way to get a top 10: sort descending, then take the first ten entries.
nutrition['potassium_mg'].sort_values(ascending=False).iloc[:10]

name
Leavening agents, cream of tartar                         16500.0
Leavening agents, low-sodium, baking powder               10100.0
Parsley, freeze-dried                                      6300.0
Beverages, unsweetened, decaffeinated, instant, tea        6040.0
Beverages, powder, unsweetened, instant, tea               6040.0
Spices, dried, chervil                                     4740.0
Spices, dried, coriander leaf                              4466.0
Celery flakes, dried                                       4388.0
Beverages, powder, regular, instant, coffee                3535.0
Beverages, half the caffeine, regular, instant, coffee     3535.0
Name: potassium_mg, dtype: float64

In [250]:
nutrition.columns

Index(['serving_size_g', 'calories', 'total_fat_g', 'saturated_fat_g',
       'cholesterol_mg', 'sodium_mg', 'choline_mg', 'folate_mcg',
       'folic_acid_mcg', 'niacin_mg', 'pantothenic_acid_mg', 'riboflavin_mg',
       'thiamin_mg', 'vitamin_a_IU', 'vitamin_a_rae_mcg', 'carotene_alpha_mcg',
       'carotene_beta_mcg', 'cryptoxanthin_beta_mcg', 'lutein_zeaxanthin_mcg',
       'lucopene', 'vitamin_b12_mcg', 'vitamin_b6_mg', 'vitamin_c_mg',
       'vitamin_d_IU', 'vitamin_e_mg', 'tocopherol_alpha_mg', 'vitamin_k_mcg',
       'calcium_mg', 'copper_mg', 'irom_mg', 'magnesium_mg', 'manganese_mg',
       'phosphorous_mg', 'potassium_mg', 'selenium_mcg', 'zink_mg',
       'protein_g', 'alanine_g', 'arginine_g', 'aspartic_acid_g', 'cystine_g',
       'glutamic_acid_g', 'glycine_g', 'histidine_g', 'hydroxyproline',
       'isoleucine_g', 'leucine_g', 'lysine_g', 'methionine_g',
       'phenylalanine_g', 'proline_g', 'serine_g', 'threonine_g',
       'tryptophan_g', 'tyrosine_g', 'valine_g', '

In [251]:
# nlargest() returns the full rows of the 10 highest values in the given column.
nutrition.nlargest(n=10, columns='potassium_mg')

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Leavening agents, cream of tartar",100.0,258.0,0.0,,0.0,52.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,36.8,0.0,0.0,1.7
"Leavening agents, low-sodium, baking powder",100.0,97.0,0.4,0.1,0.0,90.0,0.0,0.0,0.0,0.0,...,0.4,0.073,0.006,0.121,0.0,0.0,46.4,0.0,0.0,6.2
"Parsley, freeze-dried",100.0,271.0,5.2,,0.0,391.0,0.0,194.0,0.0,10.4,...,5.2,0.0,0.0,0.0,0.0,0.0,19.12,0.0,0.0,2.0
"Beverages, powder, unsweetened, instant, tea",100.0,315.0,0.0,,0.0,72.0,118.3,103.0,0.0,10.8,...,0.0,0.0,0.0,0.0,0.0,0.0,16.04,5714.0,71.0,5.09
"Beverages, unsweetened, decaffeinated, instant, tea",100.0,315.0,0.0,,0.0,72.0,118.3,103.0,0.0,10.8,...,0.0,0.0,0.0,0.0,0.0,0.0,16.04,169.0,11.0,5.09
"Spices, dried, chervil",100.0,237.0,3.9,0.2,0.0,83.0,0.0,274.0,0.0,5.4,...,3.9,0.169,1.399,1.8,0.0,0.0,16.6,0.0,0.0,7.2
"Spices, dried, coriander leaf",100.0,279.0,4.8,0.1,0.0,211.0,97.1,274.0,0.0,10.707,...,4.78,0.115,2.232,0.328,0.0,0.0,14.08,0.0,0.0,7.3
"Celery flakes, dried",100.0,319.0,2.1,0.6,0.0,1435.0,122.3,107.0,0.0,4.64,...,2.1,0.555,0.405,1.035,0.0,0.0,13.9,0.0,0.0,9.0
"Beverages, powder, regular, instant, coffee",100.0,353.0,0.5,0.2,0.0,37.0,101.9,0.0,0.0,28.173,...,0.5,0.197,0.041,0.196,0.0,0.0,8.8,3142.0,0.0,3.1
"Beverages, half the caffeine, regular, instant, coffee",100.0,352.0,0.5,0.2,0.0,37.0,101.9,0.0,0.0,28.173,...,0.5,0.197,0.041,0.196,0.0,0.0,8.8,1571.0,0.0,3.1


In [252]:
# Same top 10, showing only the potassium column of the result.
nutrition.nlargest(n=10, columns='potassium_mg')['potassium_mg']

name
Leavening agents, cream of tartar                         16500.0
Leavening agents, low-sodium, baking powder               10100.0
Parsley, freeze-dried                                      6300.0
Beverages, powder, unsweetened, instant, tea               6040.0
Beverages, unsweetened, decaffeinated, instant, tea        6040.0
Spices, dried, chervil                                     4740.0
Spices, dried, coriander leaf                              4466.0
Celery flakes, dried                                       4388.0
Beverages, powder, regular, instant, coffee                3535.0
Beverages, half the caffeine, regular, instant, coffee     3535.0
Name: potassium_mg, dtype: float64

In [253]:
# Series version: select the column first, then ask for its 10 largest values.
nutrition['potassium_mg'].nlargest(n=10)

name
Leavening agents, cream of tartar                         16500.0
Leavening agents, low-sodium, baking powder               10100.0
Parsley, freeze-dried                                      6300.0
Beverages, powder, unsweetened, instant, tea               6040.0
Beverages, unsweetened, decaffeinated, instant, tea        6040.0
Spices, dried, chervil                                     4740.0
Spices, dried, coriander leaf                              4466.0
Celery flakes, dried                                       4388.0
Beverages, powder, regular, instant, coffee                3535.0
Beverages, half the caffeine, regular, instant, coffee     3535.0
Name: potassium_mg, dtype: float64

In [254]:
# nsmallest() accepts several columns: rows are ordered by sodium first and by
# calories where sodium ties. Show the first five of the ten rows returned.
nutrition.nsmallest(n=10, columns=['sodium_mg', 'calories']).head()

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Beverages, well, tap, water",100.0,0.0,0.0,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.0,99.9
"Water, NAYA, non-carbonated, bottled",100.0,0.0,0.0,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.0,100.0
"Beverages, decaffeinated, brewed, green, tea",100.0,0.0,0.0,,0.0,0.0,0.0,0.0,0.0,0.03,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,99.93
"Beverages, EVIAN, non-carbonated, bottled, water",100.0,0.0,0.0,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.05,0.0,0.0,99.97
"Beverages, CALISTOGA, non-carbonated, bottled, water",100.0,0.0,0.0,,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.0,100.0


## 98. Skill Challenge

## 99. Solution

In [257]:
# 1. Ten foods with the highest vitamin_b12_mcg (the next four cells are equivalent approaches)

In [258]:
# Approach 1: select the column with .loc, then keep its ten largest values.
(
    nutrition
    .loc[:, 'vitamin_b12_mcg']
    .nlargest(n=10)
)

name
Mollusks, moist heat, cooked, mixed species, clam                                   98.89
Beef, boiled, cooked, variety meats and by-products liver, imported, New Zealand    96.00
Lamb, raw, liver, variety meats and by-products                                     90.05
Lamb, pan-fried, cooked, liver, variety meats and by-products                       85.70
Veal, braised, cooked, liver, variety meats and by-products                         84.60
Beef, raw, liver, variety meats and by-products, imported, New Zealand              84.50
Beef, pan-fried, cooked, liver, variety meats and by-products                       83.13
Lamb, braised, cooked, kidneys, variety meats and by-products                       78.90
Lamb, braised, cooked, liver, variety meats and by-products                         76.50
Veal, pan-fried, cooked, liver, variety meats and by-products                       72.50
Name: vitamin_b12_mcg, dtype: float64

In [259]:
# Approach 2: same result, reaching the column through attribute access.
nutrition.vitamin_b12_mcg.nlargest(n=10)

name
Mollusks, moist heat, cooked, mixed species, clam                                   98.89
Beef, boiled, cooked, variety meats and by-products liver, imported, New Zealand    96.00
Lamb, raw, liver, variety meats and by-products                                     90.05
Lamb, pan-fried, cooked, liver, variety meats and by-products                       85.70
Veal, braised, cooked, liver, variety meats and by-products                         84.60
Beef, raw, liver, variety meats and by-products, imported, New Zealand              84.50
Beef, pan-fried, cooked, liver, variety meats and by-products                       83.13
Lamb, braised, cooked, kidneys, variety meats and by-products                       78.90
Lamb, braised, cooked, liver, variety meats and by-products                         76.50
Veal, pan-fried, cooked, liver, variety meats and by-products                       72.50
Name: vitamin_b12_mcg, dtype: float64

In [260]:
# Approach 3: rank whole rows with DataFrame.nlargest, then keep only the B12 column.
nutrition.nlargest(10, 'vitamin_b12_mcg')['vitamin_b12_mcg']

name
Mollusks, moist heat, cooked, mixed species, clam                                   98.89
Beef, boiled, cooked, variety meats and by-products liver, imported, New Zealand    96.00
Lamb, raw, liver, variety meats and by-products                                     90.05
Lamb, pan-fried, cooked, liver, variety meats and by-products                       85.70
Veal, braised, cooked, liver, variety meats and by-products                         84.60
Beef, raw, liver, variety meats and by-products, imported, New Zealand              84.50
Beef, pan-fried, cooked, liver, variety meats and by-products                       83.13
Lamb, braised, cooked, kidneys, variety meats and by-products                       78.90
Lamb, braised, cooked, liver, variety meats and by-products                         76.50
Veal, pan-fried, cooked, liver, variety meats and by-products                       72.50
Name: vitamin_b12_mcg, dtype: float64

In [261]:
# Approach 4: sort the full frame by B12 descending, take the first ten rows,
# then keep only the B12 column.
(
    nutrition
    .sort_values(by='vitamin_b12_mcg', ascending=False)
    .head(10)
    ['vitamin_b12_mcg']
)

name
Mollusks, moist heat, cooked, mixed species, clam                                   98.89
Beef, boiled, cooked, variety meats and by-products liver, imported, New Zealand    96.00
Lamb, raw, liver, variety meats and by-products                                     90.05
Lamb, pan-fried, cooked, liver, variety meats and by-products                       85.70
Veal, braised, cooked, liver, variety meats and by-products                         84.60
Beef, raw, liver, variety meats and by-products, imported, New Zealand              84.50
Beef, pan-fried, cooked, liver, variety meats and by-products                       83.13
Lamb, braised, cooked, kidneys, variety meats and by-products                       78.90
Lamb, braised, cooked, liver, variety meats and by-products                         76.50
Veal, pan-fried, cooked, liver, variety meats and by-products                       72.50
Name: vitamin_b12_mcg, dtype: float64

In [262]:
# 2. Among the eggplant foods, which one has the most sodium_mg?

In [263]:
# Keep the rows whose index label (food name) contains "eggplant".
# The inline (?i) flag makes the match case-insensitive, so the full word can be
# spelled out; there is no need to drop the leading "e" to cover "Eggplant".
nutrition.filter(regex='(?i)eggplant', axis=0)

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Eggplant, raw",100.0,25.0,0.2,,0.0,2.0,6.9,22.0,0.0,0.649,...,0.18,0.034,0.016,0.076,0.0,0.0,0.66,0.0,0.0,92.3
"Eggplant, pickled",100.0,49.0,0.7,0.1,0.0,1674.0,11.9,20.0,0.0,0.66,...,0.7,0.14,0.063,0.294,0.0,0.0,1.73,0.0,0.0,86.9
"Eggplant, with salt, drained, boiled, cooked",100.0,33.0,0.2,,0.0,239.0,9.4,14.0,0.0,0.6,...,0.23,0.044,0.02,0.093,0.0,0.0,1.13,0.0,0.0,89.67
"Eggplant, without salt, drained, boiled, cooked",100.0,35.0,0.2,,0.0,1.0,9.4,14.0,0.0,0.6,...,0.23,0.044,0.02,0.093,0.0,0.0,0.54,0.0,0.0,89.67


In [264]:
# Restrict to rows whose index label contains "eggplant" (case-insensitive via (?i)),
# then report the single highest sodium_mg value among them.
# The full word is used in the pattern: (?i) already covers "Eggplant"/"eggplant".
nutrition.filter(regex='(?i)eggplant', axis=0).sodium_mg.nlargest(1)

name
Eggplant, pickled    1674.0
Name: sodium_mg, dtype: float64

In [265]:
# 3. Random 4x4 slice of the data: sample 4 rows, then 4 columns

In [266]:
# Draw 4 random rows, then 4 random columns from that result.
# No random_state is set, so every run shows a different 4x4 slice.
nutrition.sample(n=4, axis='index').sample(n=4, axis='columns')

Unnamed: 0_level_0,ash_g,cholesterol_mg,theobromine_mg,tryptophan_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
"Cocoa, unsweetened, dry powder",5.8,0.0,2057.0,0.293
"Margarine-like, with salt, stick/tub/bottle, 60% fat, vegetable oil spread",1.7,1.0,0.0,0.0
"Babyfood, strained, without vitamin c, prunes",0.98,0.0,0.0,0.0
"CAMPBELL'S Soup on the Go, Creamy Broccoli Soup",0.95,2.0,0.0,0.0


## 100. Another Skill Challenge

## 101. Solution

In [541]:
# Drop every row that has at least one missing value.
# NOTE: this mutates `nutrition` in place, so the incomplete rows are gone for the
# rest of the session; earlier cells that displayed rows containing NaN
# (e.g. "Eggplant, raw") will no longer return them if re-run after this cell.
nutrition.dropna(axis='index', how='any', inplace=True)

In [545]:
# (rows, columns) of the frame at this point in the session.
nutrition.shape

(7199, 75)

In [559]:
# Among rows whose vitamin_c_mg lies between 20 and 40 (between() includes both
# bounds by default), show the one with the fewest calories.
nutrition.loc[nutrition.vitamin_c_mg.between(20, 40), 'calories'].nsmallest(n=1)

name
Asparagus, with salt, drained, boiled, cooked, frozen    18.0
Name: calories, dtype: float64

In [563]:
# Mean of the vitamin_c_mg column; the cells below use it as the base of the
# mean + k * std thresholds.
m = nutrition['vitamin_c_mg'].mean()

In [567]:
# Lower threshold: mean plus two standard deviations of vitamin_c_mg.
mp2sd = m + 2 * nutrition['vitamin_c_mg'].std()

In [571]:
# Upper threshold: mean plus three standard deviations of vitamin_c_mg.
mp3sd = m + 3 * nutrition['vitamin_c_mg'].std()

In [569]:
# Display the mean of vitamin_c_mg computed above.
m

5.553368523406029

In [573]:
# Show the mean and the two thresholds (mean + 2 std, mean + 3 std) on one line.
print(m, mp2sd, mp3sd, sep=' ')

5.553368523406029 97.7621389681903 143.86652419058242


In [575]:
# Rows whose vitamin_c_mg falls between mean + 2 std and mean + 3 std (bounds inclusive).
nutrition.loc[nutrition['vitamin_c_mg'].between(mp2sd, mp3sd)]

Unnamed: 0_level_0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
"Peppers, raw, jalapeno",100.0,29.0,0.4,0.1,0.0,3.0,7.5,27.0,0.0,1.28,...,0.37,0.092,0.029,0.112,0.0,0.0,0.53,0.0,0.0,91.69
"Kale, raw, scotch",100.0,42.0,0.6,0.1,0.0,70.0,0.0,28.0,0.0,1.3,...,0.6,0.078,0.045,0.289,0.0,0.0,1.28,0.0,0.0,87.0
"Parsley, fresh",100.0,36.0,0.8,0.1,0.0,56.0,12.8,152.0,0.0,1.313,...,0.79,0.132,0.295,0.124,0.0,0.0,2.2,0.0,0.0,87.71
Tomato powder,100.0,302.0,0.4,0.1,0.0,134.0,0.0,120.0,0.0,9.133,...,0.44,0.062,0.066,0.179,0.0,0.0,8.91,0.0,0.0,3.06
"Kale, raw",100.0,49.0,0.9,0.1,0.0,38.0,0.8,141.0,0.0,1.0,...,0.93,0.091,0.052,0.338,0.0,0.0,2.01,0.0,0.0,84.04
"Snacks, rolls, fruit leather",100.0,371.0,3.0,0.7,0.0,317.0,13.2,2.0,0.0,0.1,...,3.0,0.672,1.48,0.552,0.0,0.0,0.9,0.0,0.0,10.2
"Spices, dried, parsley",100.0,292.0,5.5,1.4,0.0,452.0,97.1,180.0,0.0,9.943,...,5.48,1.378,0.761,3.124,0.0,0.0,11.36,0.0,0.0,5.89
"Tomatoes, drained, packed in oil, sun-dried",100.0,213.0,14.0,1.9,0.0,266.0,0.0,23.0,0.0,3.63,...,14.08,1.893,8.663,2.06,0.0,0.0,3.7,0.0,0.0,53.83
"Snacks, with vitamin C, pieces, fruit leather",100.0,373.0,3.5,1.0,0.0,317.0,0.0,14.0,0.0,0.1,...,3.5,0.99,1.724,0.093,0.0,0.0,1.0,0.0,0.0,10.2
"Cereals ready-to-eat, HEALTH VALLEY, OAT BRAN FLAKES",100.0,380.0,3.0,1.0,0.0,380.0,22.9,200.0,181.0,10.0,...,3.0,1.0,0.704,0.897,0.0,0.0,5.53,0.0,0.0,3.4


In [577]:
# (rows, columns) of the subset whose vitamin_c_mg lies in [mean + 2 std, mean + 3 std].
nutrition.loc[nutrition['vitamin_c_mg'].between(mp2sd, mp3sd)].shape

(17, 75)

In [579]:
# Keep the subset with vitamin_c_mg in [mean + 2 std, mean + 3 std] under its own
# name so it can be summarised without repeating the filter.
result_set = nutrition.loc[nutrition['vitamin_c_mg'].between(mp2sd, mp3sd)]

In [583]:
# Summary statistics (count, mean, std, min, quartiles, max) for each numeric
# column of the filtered subset.
result_set.describe()

Unnamed: 0,serving_size_g,calories,total_fat_g,saturated_fat_g,cholesterol_mg,sodium_mg,choline_mg,folate_mcg,folic_acid_mcg,niacin_mg,...,fat_g,saturated_fatty_acids_g,monounsaturated_fatty_acids_g,polyunsaturated_fatty_acids_g,fatty_acids_total_trans_mg,alcohol_g,ash_g,caffeine_mg,theobromine_mg,water_g
count,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,...,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0
mean,100.0,254.588235,4.129412,0.964706,3.411765,267.588235,32.994118,139.882353,72.058824,7.618235,...,4.112941,0.946882,1.768353,0.954471,3.411765,0.0,3.882941,3.705882,41.588235,31.429412
std,0.0,140.672074,4.693581,1.134648,10.718319,215.914062,66.390535,150.379887,151.563712,10.817866,...,4.663148,1.136581,2.854251,1.288771,10.718319,0.0,3.49288,12.726767,147.915119,36.400353
min,100.0,29.0,0.4,0.1,0.0,3.0,0.0,0.0,0.0,0.0,...,0.37,0.062,0.029,0.093,0.0,0.0,0.53,0.0,0.0,2.0
25%,100.0,146.0,0.8,0.1,0.0,56.0,0.0,23.0,0.0,1.0,...,0.79,0.092,0.063,0.124,0.0,0.0,1.0,0.0,0.0,5.89
50%,100.0,302.0,3.0,0.7,0.0,317.0,7.5,120.0,0.0,3.397,...,3.0,0.672,0.704,0.338,0.0,0.0,2.84,0.0,0.0,10.2
75%,100.0,371.0,5.1,1.4,0.0,429.0,24.5,180.0,0.0,9.943,...,5.1,1.36,1.724,1.07,0.0,0.0,5.53,0.0,0.0,62.0
max,100.0,422.0,14.0,4.5,44.0,717.0,266.9,500.0,500.0,38.442,...,14.08,4.499,9.11,4.804,44.0,0.0,11.36,52.0,608.0,91.69
