In [174]:
import pandas as pd
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)

import csv
import re

import numpy as np
import math

from sklearn import preprocessing

## Extrating the Train Data

In [176]:
df = pd.DataFrame(pd.read_json('distiller_20200330.json'))
df.insert(0,'id', range(len(df)))
df.reset_index(drop=True)
df.sample(5)

Unnamed: 0,id,abv,age,average_user_rating,brand_name,cost_level,description,expert_rating,flavor_profile,name,origin,reviewer,tasting_notes,type,user_comments
1954,1954,40.0,,,Puerto Angel,2,Produced in a distillery located in the Oaxaca...,86.0,"{'earthy': 0, 'floral': 20, 'fruity': 40, 'her...",Puerto Angel Blanco Rum,Mexico,Paul Senft,The aroma delivers an interesting balance of m...,Silver Rum,0
7215,7215,48.0,,77.0,Kilchoman,4,This vintage bottling from Kilchoman is a vatt...,91.0,"{'briny': 25, 'floral': 20, 'fruity': 30, 'ful...",Kilchoman Vintage 2010,"Islay, Scotland",Jacob Grier,This is assertively peated whisky with some oo...,Peated Single Malt,5
5376,5376,40.0,,66.8,E & J,1,E&J distillers is owned by the Ernest and Juli...,,,E&J XO Brandy,"California, USA",,,American Brandy,38
2643,2643,46.0,,67.6,Finlaggan,2,"Family-run independent bottler, The Vintage Ma...",,,Finlaggan Eilean Mòr,"Islay, Scotland",,,Peated Single Malt,31
4591,4591,50.0,,68.0,Heaven Hill,1,"Old Fitzgerald, a product of Heaven Hills Dist...",84.0,"{'briny': 0, 'floral': 40, 'fruity': 64, 'full...",Old Fitzgerald Bottled In Bond Bourbon,"Kentucky, USA",Ryan Conklin,The nose on this whiskey is round with a good ...,Bourbon,75


In [177]:
df.to_csv('distiller_20200330.csv', index=False)

In [178]:
df = df[(df['tasting_notes'].isnull() == False) & (df['flavor_profile'].isnull() == False)]
print(len(df))

df = df[['id','type','expert_rating','tasting_notes','flavor_profile']]
df.head(5)

3513


Unnamed: 0,id,type,expert_rating,tasting_notes,flavor_profile
5,5,Canadian,95.0,This rye beast is crammed with so many spices ...,"{'briny': 0, 'floral': 45, 'fruity': 45, 'full..."
6,6,American Brandy,75.0,The aromatics of this brandy have a strong app...,"{'earthy': 5, 'floral': 10, 'fruity': 75, 'her..."
7,7,Old Tom Gin,90.0,Sweet spices and floral aromas are found as yo...,"{'bitter': 10, 'chemical': 0, 'earthy': 45, 'f..."
11,11,Other Whiskey,84.0,"The nose is floral, with honey, hay, citrus ze...","{'briny': 0, 'floral': 50, 'fruity': 20, 'full..."
12,12,Flavored Whiskey,84.0,The nose is at first difficult to find behind ...,"{'briny': 0, 'floral': 10, 'fruity': 30, 'full..."


In [179]:
df.sample(5)

Unnamed: 0,id,type,expert_rating,tasting_notes,flavor_profile
2969,2969,Navy Rum,80.0,This product's strong aroma is flush with note...,"{'earthy': 75, 'floral': 40, 'fruity': 20, 'he..."
591,591,Amaro,90.0,Cynar's deep amber color accurately hints at i...,"{'bitter': 95, 'earthy': 50, 'floral': 0, 'fru..."
1159,1159,London Dry Gin,87.0,The aroma is much more aromatic with the sweet...,"{'bitter': 10, 'chemical': 0, 'earthy': 25, 'f..."
4944,4944,Canadian,87.0,This whisky hits hard with a sweet nose brimmi...,"{'briny': 0, 'floral': 30, 'fruity': 45, 'full..."
1113,1113,Single Malt,86.0,Israel isn't the first country one thinks of f...,"{'briny': 30, 'floral': 25, 'fruity': 30, 'ful..."


### Exporting as new CSV

In [180]:
df.to_csv('train_raw.csv')

## Re-organize the Data

In [181]:
id_ = []
name = []
flavor_profile = []
tasting_notes = []
expert_rating = []
type_ = []

flavor_data = []

with open('train_raw.csv', 'r', newline='', encoding="utf-8") as file:
    reader = csv.reader(file)
    
    for row in reader: 
        
        i = row[0]
        n = row[1]
        c = row[2]
        flavor = row[5].strip('{').strip('}\r').split(',')
        note = row[4].strip()
        rating = row[3]
        
        flavors = []
        
        for item in flavor:
            items = item.strip().split(':')

            flavors.append(items)              
        
        id_.append(i)
        name.append(n)
        flavor_data.append(flavors)
        tasting_notes.append(note)
        expert_rating.append(rating)
        type_.append(c)
        
        
del id_[0]
del name[0]
del type_[0]
del flavor_data[0]  
del tasting_notes[0]
del expert_rating[0]

for line in flavor_data:
    flavor_profile.append(dict(line))

## Allocating Type to Category

In [182]:
type_list = []

for item in type_:
    type_list.append(item)

type_list = list(set(type_list))

print(type_list)

['Flavored Whiskey', 'Other Brandy', 'Sotol Blanco', 'Tequila Mixto Blanco', 'Rhum Agricole Éléve Sous Bois', 'Flavored Rum', 'Rye', 'Mezcal Joven', 'Aged Rum', 'Cognac', 'Barrel-Aged Gin', 'Eau-de-Vie', 'Flavored Gin', 'Spiced Rum', 'Tequila Añejo', 'Unflavored Vodka', 'Blended Grain', 'Calvados', 'Wheat Whiskey', 'Other Agave', 'Chocolate Liqueurs', 'Old Tom Gin', 'Blended', 'Sloe Gin & Variants', 'Pisco', 'Silver Rum', 'Genever-Style', 'Navy-Strength Gin', 'Bourbon', 'Armagnac', 'London Dry Gin', 'Single Pot Still', 'Tennessee', 'Coffee Liqueurs', 'Distilled Gin', 'Modern Gin', 'Single Grain', 'Other Liqueurs', 'White', 'Rhum Agricole Blanc', 'Nut Liqueurs', 'Spirit', 'Gold Rum', 'Tequila Mixto Gold', 'Floral Liqueurs', 'Other Sugarcane', 'Canadian', 'American Brandy', 'Tequila Reposado', 'Blended American Whiskey', 'Corn', 'Single Malt', 'Blended Malt', 'Bitter Liqueurs', 'Genever', 'Triple Sec/Curaçao', 'Grappa/Marc', 'Fruit Liqueurs', 'Peated Single Malt', 'Herbal/Spice Liqueurs'

In [183]:
category= []

category_list = ['Whiskey', 'Brandy', 'Rum', 'Gin', 'Vodka', 'Tequila', 'Liqueurs/Bitters']

whiskey_list = ['Blended Malt', 'Tennessee', 'Peated Single Malt', 'Single Grain', 'Blended', 'Flavored Whiskey', 'Corn', 
                'American Single Malt', 'Blended Grain', 'Blended American Whiskey', 'Rye', 'Bourbon', 'Other Whiskey',
                'Single Malt', 'Wheat Whiskey', 'White', 'Peated Blend', 'Peated Blended Malt', 'Spirit', 'Single Pot Still',
                'Canadian', ]

brandy_list = ['Eau-de-Vie', 'Other Brandy', 'Grappa/Marc',  'Cognac', 'Armagnac', 'Calvados', 'Blanche Armagnac', 'American Brandy',
              'Pisco', ]

rum_list = ['Rhum Agricole Éléve Sous Bois', 'Spiced Rum', 'Gold Rum', 'Aged Rum', 'Aguardiente', 'Flavored Rum', 'Navy Rum',
            'Rhum Agricole Blanc', 'Cachaça', 'Dark Rum', 'Silver Rum', 'Rhum Agricole Vieux', 'Other Sugarcane']

gin_list = ['Distilled Gin', 'Flavored Gin', 'Old Tom Gin', 'Plymouth Gin', 'London Dry Gin', 'Navy-Strength Gin', 
            'Gin de Mahón', 'Compound Gin', 'Genever', 'Modern Gin', 'Genever-Style', 'Barrel-Aged Gin']

vodka_list = ['Unflavored Vodka', 'Flavored Vodka', ]

tequila_list = ['Tequila Añejo', 'Tequila Blanco', 'Tequila Mixto Blanco', 'Tequila Joven', 'Tequila Extra Añejo', 'Mezcal Joven',
               'Raicilla Blanco', 'Tequila Mixto Gold', 'Mezcal Reposado', 'Other Agave', 'Sotol Blanco', 'Tequila Reposado',
               'Sotol Añejo', 'Mezcal Añejo', ]

liqueur_list = ['Bitter Liqueurs', 'Sloe Gin & Variants', 'Chocolate Liqueurs', 'Other Liqueurs', 'Herbal/Spice Liqueurs',
                'Coffee Liqueurs', 'Amaro', 'Triple Sec/Curaçao', 'Fruit Liqueurs', 'Nut Liqueurs', 'Floral Liqueurs', 
                'Dairy/Egg Liqueurs']

for item in type_:

    if item in whiskey_list:
        category.append(category_list[0])
    
    elif item in brandy_list:
        category.append(category_list[1])
        
    elif item in rum_list:
        category.append(category_list[2])
        
    elif item in gin_list:
        category.append(category_list[3])
        
    elif item in vodka_list:
        category.append(category_list[4])
        
    elif item in tequila_list:
        category.append(category_list[5])
        
    else:
        category.append(category_list[6])     

print(type_[-10:-1])            
print(category[-10:-1])

['London Dry Gin', 'Single Malt', 'Gold Rum', 'Cachaça', 'Canadian', 'Spiced Rum', 'American Brandy', 'Amaro', 'Flavored Vodka']
['Gin', 'Whiskey', 'Rum', 'Rum', 'Whiskey', 'Rum', 'Brandy', 'Liqueurs/Bitters', 'Vodka']


## Check the Data

In [184]:
print(len(flavor_profile))
print(type(flavor_profile[-1]))
# print(flavor_profile[0].keys())
# print(flavor_profile[0].values())
print(flavor_profile[-1])

3513
<class 'dict'>
{"'bitter'": ' 0', "'earthy'": ' 10', "'floral'": ' 10', "'fruity'": ' 40', "'herbal'": ' 50', "'mineral'": ' 10', "'oily'": ' 15', "'rich'": ' 30', "'salty'": ' 5', "'smoky'": ' 25', "'spicy'": ' 20', "'sweet'": ' 60', "'tart'": ' 0', "'umami'": ' 5'}


In [185]:
print(len(tasting_notes))
print(type(tasting_notes[-1]))
print(tasting_notes[-1])

3513
<class 'str'>
As unharmonious as those donkeys might be, the flavors of this mezcal are quite the opposite - everything plays together with each pleasurable sip. It has a subtle, sweet and light smoke, with a minty and peppery finish. Roasted agave fruit flavors really shine through with a light, dewy mouthfeel.


In [186]:
print(len(expert_rating))
print(type(expert_rating[0]))
print(expert_rating[0])

3513
<class 'str'>
95.0


## Extracting Flavor Profile Labels

In [187]:
flavor_labels = set()

for keys in flavor_profile:
    for key in keys.keys():
        flavor_labels.add(key)
    
label_list = list(flavor_labels)
print(label_list)
print(len(label_list))

["'rich'", "'chemical'", "'tart'", "'peaty'", "'spicy'", "'floral'", "'bitter'", "'juniper'", "'salty'", "'hogo'", "'nutty'", "'fruity'", "'umami'", "'neutral'", "'rancio'", "'roast'", "'mineral'", "'grain'", "'sweet'", "'briny'", "'vanilla'", "'oily'", "'harsh'", "'full_bodied'", "'earthy'", "'herbal'", "'woody'", "'smoky'"]
28


## Emerging to the New Data

In [188]:
import math

new_data = []

for item in flavor_profile:

    new_keys = []
    new_values = []
    
    for key in item:
    
        for label in label_list:
            if label in item.keys():

                new_keys.append(key.strip("'"))
                new_values.append(math.ceil(int(item[key])/20))
            
            elif label not in item.keys():
                
                new_keys.append(label.strip("'"))
                new_values.append(0)
                
    flavors = dict(zip(new_keys, new_values))
    
    new_data.append(flavors)

In [189]:
print(len(new_data), type(new_data))
print(new_data[-1], type(new_data[-1]))

3513 <class 'list'>
{'bitter': 0, 'chemical': 0, 'peaty': 0, 'juniper': 0, 'hogo': 0, 'nutty': 0, 'neutral': 0, 'rancio': 0, 'roast': 0, 'grain': 0, 'briny': 0, 'vanilla': 0, 'harsh': 0, 'full_bodied': 0, 'woody': 0, 'earthy': 1, 'floral': 1, 'fruity': 2, 'herbal': 3, 'mineral': 1, 'oily': 1, 'rich': 2, 'salty': 1, 'smoky': 2, 'spicy': 1, 'sweet': 3, 'tart': 0, 'umami': 1} <class 'dict'>


In [190]:
for index, item in enumerate(new_data):

    for key in item:
        item[key] = int(item[key])
        #item[key] = flavor_scale[item[key]]
        
    item['id'] = id_[index]
    item['rating'] = round(float(expert_rating[index]))
    item['category'] = category[index]
    item['tasting_notes'] = tasting_notes[index]

In [191]:
new_data[0]

{'briny': 0,
 'chemical': 0,
 'bitter': 0,
 'juniper': 0,
 'hogo': 0,
 'nutty': 0,
 'umami': 0,
 'neutral': 0,
 'rancio': 0,
 'roast': 0,
 'mineral': 0,
 'grain': 0,
 'harsh': 0,
 'earthy': 0,
 'woody': 0,
 'floral': 3,
 'fruity': 3,
 'full_bodied': 3,
 'herbal': 1,
 'oily': 2,
 'peaty': 0,
 'rich': 3,
 'salty': 0,
 'smoky': 2,
 'spicy': 4,
 'sweet': 2,
 'tart': 1,
 'vanilla': 2,
 'id': '5',
 'rating': 95,
 'category': 'Whiskey',
 'tasting_notes': 'This rye beast is crammed with so many spices that a copper label is fitted to the bottle to brace it from bulging. Fruity spring flowers and freshly baked rye bread flood from the whisky. And not just any rye bread, but the kind they teach in a prison baking class. The robust rye spices and bottomless oak rumble on the palate with a delicate caramel that pulls its own weight. The Energizer Bunny’s mentor is the endless finish. An instant classic.'}

### Multi-Hot Encoding the Labels

In [192]:
df = pd.DataFrame(new_data)
df_text = df.iloc[:,-1:]
df_label = df.iloc[:, 0:-4] 

In [193]:
df = pd.DataFrame(df['id']).join(df_text)
df = df.join(df_label)
df.head()

Unnamed: 0,id,tasting_notes,briny,chemical,bitter,juniper,hogo,nutty,umami,neutral,rancio,roast,mineral,grain,harsh,earthy,woody,floral,fruity,full_bodied,herbal,oily,peaty,rich,salty,smoky,spicy,sweet,tart,vanilla
0,5,This rye beast is crammed with so many spices ...,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,3,3,1,2,0,3,0,2,4,2,1,2
1,6,The aromatics of this brandy have a strong app...,0,0,0,0,0,2,0,0,1,4,0,0,0,1,5,1,4,0,1,3,0,4,0,1,0,5,0,0
2,7,Sweet spices and floral aromas are found as yo...,0,0,1,3,0,0,0,0,0,0,0,0,0,3,0,3,2,0,1,3,0,4,0,0,3,2,0,0
3,11,"The nose is floral, with honey, hay, citrus ze...",0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,1,3,3,2,0,3,0,1,4,3,2,3
4,12,The nose is at first difficult to find behind ...,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,2,2,3,3,0,2,0,1,2,2,1,2


In [194]:
df_labels = pd.get_dummies(df.iloc[:,2:], columns= df.iloc[:,2:].columns)
col_name = df_labels.columns.tolist()

missed_col = ['chemical_4']
insert_pos = ['chemical_5']

for index, item in enumerate(missed_col):
    col_name.insert(col_name.index(insert_pos[index]), item)  

df_labels = df_labels.reindex(columns=col_name)

df_labels.columns

Index(['briny_0', 'briny_1', 'briny_2', 'briny_3', 'briny_4', 'briny_5',
       'chemical_0', 'chemical_1', 'chemical_2', 'chemical_3',
       ...
       'tart_2', 'tart_3', 'tart_4', 'tart_5', 'vanilla_0', 'vanilla_1',
       'vanilla_2', 'vanilla_3', 'vanilla_4', 'vanilla_5'],
      dtype='object', length=168)

In [195]:
df_info = df.iloc[:,0:2]
df_labels = df_labels.fillna(0, axis=1).astype('uint8')

df2 = pd.concat([df_info, df_labels], axis=1)

print(len(df2.columns.tolist()[2:]))
df2.head(5)

168


Unnamed: 0,id,tasting_notes,briny_0,briny_1,briny_2,briny_3,briny_4,briny_5,chemical_0,chemical_1,chemical_2,chemical_3,chemical_4,chemical_5,bitter_0,bitter_1,bitter_2,bitter_3,bitter_4,bitter_5,juniper_0,juniper_1,juniper_2,juniper_3,juniper_4,juniper_5,hogo_0,hogo_1,hogo_2,hogo_3,hogo_4,hogo_5,nutty_0,nutty_1,nutty_2,nutty_3,nutty_4,nutty_5,umami_0,umami_1,umami_2,umami_3,umami_4,umami_5,neutral_0,neutral_1,neutral_2,neutral_3,neutral_4,neutral_5,rancio_0,rancio_1,rancio_2,rancio_3,rancio_4,rancio_5,roast_0,roast_1,roast_2,roast_3,roast_4,roast_5,mineral_0,mineral_1,mineral_2,mineral_3,mineral_4,mineral_5,grain_0,grain_1,grain_2,grain_3,grain_4,grain_5,harsh_0,harsh_1,harsh_2,harsh_3,harsh_4,harsh_5,earthy_0,earthy_1,earthy_2,earthy_3,earthy_4,earthy_5,woody_0,woody_1,woody_2,woody_3,woody_4,woody_5,floral_0,floral_1,floral_2,floral_3,floral_4,floral_5,fruity_0,fruity_1,fruity_2,fruity_3,fruity_4,fruity_5,full_bodied_0,full_bodied_1,full_bodied_2,full_bodied_3,full_bodied_4,full_bodied_5,herbal_0,herbal_1,herbal_2,herbal_3,herbal_4,herbal_5,oily_0,oily_1,oily_2,oily_3,oily_4,oily_5,peaty_0,peaty_1,peaty_2,peaty_3,peaty_4,peaty_5,rich_0,rich_1,rich_2,rich_3,rich_4,rich_5,salty_0,salty_1,salty_2,salty_3,salty_4,salty_5,smoky_0,smoky_1,smoky_2,smoky_3,smoky_4,smoky_5,spicy_0,spicy_1,spicy_2,spicy_3,spicy_4,spicy_5,sweet_0,sweet_1,sweet_2,sweet_3,sweet_4,sweet_5,tart_0,tart_1,tart_2,tart_3,tart_4,tart_5,vanilla_0,vanilla_1,vanilla_2,vanilla_3,vanilla_4,vanilla_5
0,5,This rye beast is crammed with so many spices ...,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0
1,6,The aromatics of this brandy have a strong app...,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,1,0,0,0,0,0
2,7,Sweet spices and floral aromas are found as yo...,1,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0
3,11,"The nose is floral, with honey, hay, citrus ze...",1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0
4,12,The nose is at first difficult to find behind ...,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0


### Exporting as CSV

In [196]:
df2.to_csv('train_data.csv', index=False)

### Basic Exploratory Data Analysis

In [197]:
round(df2.iloc[:,:].describe())

Unnamed: 0,briny_0,briny_1,briny_2,briny_3,briny_4,briny_5,chemical_0,chemical_1,chemical_2,chemical_3,chemical_4,chemical_5,bitter_0,bitter_1,bitter_2,bitter_3,bitter_4,bitter_5,juniper_0,juniper_1,juniper_2,juniper_3,juniper_4,juniper_5,hogo_0,hogo_1,hogo_2,hogo_3,hogo_4,hogo_5,nutty_0,nutty_1,nutty_2,nutty_3,nutty_4,nutty_5,umami_0,umami_1,umami_2,umami_3,umami_4,umami_5,neutral_0,neutral_1,neutral_2,neutral_3,neutral_4,neutral_5,rancio_0,rancio_1,rancio_2,rancio_3,rancio_4,rancio_5,roast_0,roast_1,roast_2,roast_3,roast_4,roast_5,mineral_0,mineral_1,mineral_2,mineral_3,mineral_4,mineral_5,grain_0,grain_1,grain_2,grain_3,grain_4,grain_5,harsh_0,harsh_1,harsh_2,harsh_3,harsh_4,harsh_5,earthy_0,earthy_1,earthy_2,earthy_3,earthy_4,earthy_5,woody_0,woody_1,woody_2,woody_3,woody_4,woody_5,floral_0,floral_1,floral_2,floral_3,floral_4,floral_5,fruity_0,fruity_1,fruity_2,fruity_3,fruity_4,fruity_5,full_bodied_0,full_bodied_1,full_bodied_2,full_bodied_3,full_bodied_4,full_bodied_5,herbal_0,herbal_1,herbal_2,herbal_3,herbal_4,herbal_5,oily_0,oily_1,oily_2,oily_3,oily_4,oily_5,peaty_0,peaty_1,peaty_2,peaty_3,peaty_4,peaty_5,rich_0,rich_1,rich_2,rich_3,rich_4,rich_5,salty_0,salty_1,salty_2,salty_3,salty_4,salty_5,smoky_0,smoky_1,smoky_2,smoky_3,smoky_4,smoky_5,spicy_0,spicy_1,spicy_2,spicy_3,spicy_4,spicy_5,sweet_0,sweet_1,sweet_2,sweet_3,sweet_4,sweet_5,tart_0,tart_1,tart_2,tart_3,tart_4,tart_5,vanilla_0,vanilla_1,vanilla_2,vanilla_3,vanilla_4,vanilla_5
count,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0,3513.0
mean,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
std,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
min,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
25%,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
50%,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
75%,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0
max,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0


In [198]:
tasting_notes_len = []

for item in df2['tasting_notes']:
    tasting_notes_len.append(len(item))
    
print(sum(tasting_notes_len))
    
pd.Series(tasting_notes_len).describe()

1336298


count    3513.000000
mean      380.386564
std       104.685472
min       110.000000
25%       310.000000
50%       366.000000
75%       435.000000
max       903.000000
dtype: float64

In [22]:
pandas_profiling.ProfileReport(df2)

  variable_stats = pd.concat(ldesc, join_axes=pd.Index([names]), axis=1)


0,1
Number of variables,32
Number of observations,3451
Total Missing (%),0.0%
Total size in memory,862.9 KiB
Average record size in memory,256.0 B

0,1
Numeric,30
Categorical,2
Boolean,0
Date,0
Text (Unique),0
Rejected,0
Unsupported,0

0,1
Distinct count,3451
Unique (%),100.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1725
Minimum,0
Maximum,3450
Zeros (%),0.0%

0,1
Minimum,0.0
5-th percentile,172.5
Q1,862.5
Median,1725.0
Q3,2587.5
95-th percentile,3277.5
Maximum,3450.0
Range,3450.0
Interquartile range,1725.0

0,1
Standard deviation,996.36
Coef of variation,0.5776
Kurtosis,-1.2
Mean,1725
MAD,862.75
Skewness,0
Sum,5952975
Variance,992740
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
2047,1,0.0%,
589,1,0.0%,
585,1,0.0%,
2632,1,0.0%,
581,1,0.0%,
2628,1,0.0%,
577,1,0.0%,
2624,1,0.0%,
573,1,0.0%,
2620,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0,1,0.0%,
1,1,0.0%,
2,1,0.0%,
3,1,0.0%,
4,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
3446,1,0.0%,
3447,1,0.0%,
3448,1,0.0%,
3449,1,0.0%,
3450,1,0.0%,

0,1
Distinct count,43
Unique (%),1.2%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,86.668
Minimum,40
Maximum,99
Zeros (%),0.0%

0,1
Minimum,40
5-th percentile,77
Q1,84
Median,87
Q3,90
95-th percentile,95
Maximum,99
Range,59
Interquartile range,6

0,1
Standard deviation,5.7457
Coef of variation,0.066295
Kurtosis,3.3787
Mean,86.668
MAD,4.3907
Skewness,-1.0996
Sum,299090
Variance,33.013
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
90,320,9.3%,
88,304,8.8%,
87,265,7.7%,
89,245,7.1%,
92,209,6.1%,
86,206,6.0%,
84,204,5.9%,
85,203,5.9%,
91,190,5.5%,
83,157,4.5%,

Value,Count,Frequency (%),Unnamed: 3
40,1,0.0%,
50,1,0.0%,
54,1,0.0%,
55,2,0.1%,
58,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
95,73,2.1%,
96,64,1.9%,
97,31,0.9%,
98,16,0.5%,
99,5,0.1%,

0,1
Distinct count,7
Unique (%),0.2%
Missing (%),0.0%
Missing (n),0

0,1
Whiskey,2095
Rum,352
Tequila,307
Other values (4),697

Value,Count,Frequency (%),Unnamed: 3
Whiskey,2095,60.7%,
Rum,352,10.2%,
Tequila,307,8.9%,
Brandy,276,8.0%,
Gin,271,7.9%,
Liqueurs/Bitters,76,2.2%,
Vodka,74,2.1%,

0,1
Distinct count,3442
Unique (%),99.7%
Missing (%),0.0%
Missing (n),0

0,1
"The nose is sweet with honey, vanilla, and a touch of spice. The palate has even more sweet corn, with a slight rye spice flavor and more honey. The finish is longer than one might expect with more brown sugar and oak.",2
"Upon nosing this whisky, you'll get grapes and nuts with vanilla and honey to follow. The whisky is slightly chewy in the middle and finishes with gentle wood spice and raisins. It's a classic for a reason and a good measure of the entire collection Balvenie creates.",2
"The rose scent comes through loud and clear on the aroma. Juniper and bright coriander follow soon after, but cucumber joins in the party once you taste. Overall, not too earthy and the spices are moderate and only slightly bitter. The gin isn't bold and brash so look elsewhere for the punch of juniper. The goal of the gin seems to have been met which was a British garden tea party. Speaking of daytime drinking, try this in a Corpse Reviver #2 to revive you from the previous evening.",2
Other values (3439),3445

Value,Count,Frequency (%),Unnamed: 3
"The nose is sweet with honey, vanilla, and a touch of spice. The palate has even more sweet corn, with a slight rye spice flavor and more honey. The finish is longer than one might expect with more brown sugar and oak.",2,0.1%,
"Upon nosing this whisky, you'll get grapes and nuts with vanilla and honey to follow. The whisky is slightly chewy in the middle and finishes with gentle wood spice and raisins. It's a classic for a reason and a good measure of the entire collection Balvenie creates.",2,0.1%,
"The rose scent comes through loud and clear on the aroma. Juniper and bright coriander follow soon after, but cucumber joins in the party once you taste. Overall, not too earthy and the spices are moderate and only slightly bitter. The gin isn't bold and brash so look elsewhere for the punch of juniper. The goal of the gin seems to have been met which was a British garden tea party. Speaking of daytime drinking, try this in a Corpse Reviver #2 to revive you from the previous evening.",2,0.1%,
"This is a familiar rye with textbook floral notes on the nose. Popping toasted grains swirl with oaky vanilla leading your mouth on a journey of rye spiciness and creamy caramel. Orange citrus mixed with baking spices, such as clove and hot cinnamon, hang around a long time like they’ve been charged by the Energizer Bunny. This whisky is a prodigy for cocktails but just as delicious as a sipper.",2,0.1%,
"The Black Label is definitely known as the peated Johnnie, but what people don't discuss much are all the other goodies in the stocking. The nose displays vanilla cream, citrus zest, and nectarine and as you continue the journey, toasted malt, butterscotch, and golden raisins are there to greet you. The peat smoke present and accounted for, but is a smoldering fire at best.",2,0.1%,
"The whisky is fashionably late to show up, but what an impression it makes when it finally does. There's not much on the nose, initially, except raisins and a wisp of smoke. You taste it and the whisky is still playing coy, and then BAM! The flavors completely flood your palate. Dried fruits, nuts, cereal, dark chocolate, dark honey, violets, dried herbs--the list seems endless. The pleasant aftertaste lingers with lightly charred smoke and fruity sherry notes.",2,0.1%,
"This is a slow to get going whisky, but once it has an opportunity to sit in the glass for just a minute, it really opens up. The dark sherried notes come through on the nose, but also checking in for a visit are honey, orange peels, and cooked apples. Some dark chocolate and cinnamon appear and chewy oak tannins arrive fashionably late to the party.",2,0.1%,
The aroma are unmistakably markers for the American wood aging with aromas of vanilla and coconut. Cinnamon and ginger are in attendance and there is a beeswax quality to the texture and taste of the whisky.,2,0.1%,
The sweet aroma is very inviting and draws you in closer to inspect the dram. The honey'd and vanilla fragrance takes a turn on the palate replaced by grass and pineapple. A lemon twist or two comes next with the peat smoke just teasing your senses.,2,0.1%,
"This blend plays up to its name quite well with an enjoyable mix of peat smoke and spice from start to finish. The aromas are lead by a waft of (almost Mediterranean) baking spices and backed up by toasted nut and chili flake notes. The palate is immediately coating and brings a layered mix of caramelized sugar, dried apricot and lean peat smoke. The chili flake note returns for a nice accent at the end.",1,0.0%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.34628
Minimum,0
Maximum,4
Zeros (%),82.2%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,2
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.83842
Coef of variation,2.4213
Kurtosis,5.9222
Mean,0.34628
MAD,0.56913
Skewness,2.5551
Sum,1195
Variance,0.70296
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,2836,82.2%,
2,234,6.8%,
1,231,6.7%,
3,104,3.0%,
4,46,1.3%,

Value,Count,Frequency (%),Unnamed: 3
0,2836,82.2%,
1,231,6.7%,
2,234,6.8%,
3,104,3.0%,
4,46,1.3%,

Value,Count,Frequency (%),Unnamed: 3
0,2836,82.2%,
1,231,6.7%,
2,234,6.8%,
3,104,3.0%,
4,46,1.3%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,2.5462
Minimum,0
Maximum,4
Zeros (%),0.7%

0,1
Minimum,0
5-th percentile,1
Q1,2
Median,3
Q3,3
95-th percentile,4
Maximum,4
Range,4
Interquartile range,1

0,1
Standard deviation,0.89756
Coef of variation,0.35251
Kurtosis,-0.48963
Mean,2.5462
MAD,0.76914
Skewness,-0.16278
Sum,8787
Variance,0.80562
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
3,1342,38.9%,
2,1193,34.6%,
4,494,14.3%,
1,399,11.6%,
0,23,0.7%,

Value,Count,Frequency (%),Unnamed: 3
0,23,0.7%,
1,399,11.6%,
2,1193,34.6%,
3,1342,38.9%,
4,494,14.3%,

Value,Count,Frequency (%),Unnamed: 3
0,23,0.7%,
1,399,11.6%,
2,1193,34.6%,
3,1342,38.9%,
4,494,14.3%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,2.1666
Minimum,0
Maximum,4
Zeros (%),3.3%

0,1
Minimum,0
5-th percentile,1
Q1,2
Median,2
Q3,3
95-th percentile,4
Maximum,4
Range,4
Interquartile range,1

0,1
Standard deviation,0.94688
Coef of variation,0.43703
Kurtosis,-0.40726
Mean,2.1666
MAD,0.75605
Skewness,-0.056407
Sum,7477
Variance,0.89658
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
2,1363,39.5%,
3,1011,29.3%,
1,710,20.6%,
4,252,7.3%,
0,115,3.3%,

Value,Count,Frequency (%),Unnamed: 3
0,115,3.3%,
1,710,20.6%,
2,1363,39.5%,
3,1011,29.3%,
4,252,7.3%,

Value,Count,Frequency (%),Unnamed: 3
0,115,3.3%,
1,710,20.6%,
2,1363,39.5%,
3,1011,29.3%,
4,252,7.3%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,2.3764
Minimum,0
Maximum,4
Zeros (%),2.6%

0,1
Minimum,0
5-th percentile,1
Q1,2
Median,2
Q3,3
95-th percentile,4
Maximum,4
Range,4
Interquartile range,1

0,1
Standard deviation,1.0201
Coef of variation,0.42926
Kurtosis,-0.65634
Mean,2.3764
MAD,0.86743
Skewness,-0.12269
Sum,8201
Variance,1.0406
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
2,1151,33.4%,
3,1088,31.5%,
1,619,17.9%,
4,504,14.6%,
0,89,2.6%,

Value,Count,Frequency (%),Unnamed: 3
0,89,2.6%,
1,619,17.9%,
2,1151,33.4%,
3,1088,31.5%,
4,504,14.6%,

Value,Count,Frequency (%),Unnamed: 3
0,89,2.6%,
1,619,17.9%,
2,1151,33.4%,
3,1088,31.5%,
4,504,14.6%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.051289
Minimum,0
Maximum,4
Zeros (%),95.5%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,0
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.25928
Coef of variation,5.0551
Kurtosis,56.413
Mean,0.051289
MAD,0.098001
Skewness,6.5369
Sum,177
Variance,0.067224
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,3297,95.5%,
1,139,4.0%,
2,8,0.2%,
3,6,0.2%,
4,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0,3297,95.5%,
1,139,4.0%,
2,8,0.2%,
3,6,0.2%,
4,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0,3297,95.5%,
1,139,4.0%,
2,8,0.2%,
3,6,0.2%,
4,1,0.0%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1.2286
Minimum,0
Maximum,4
Zeros (%),24.2%

0,1
Minimum,0
5-th percentile,0
Q1,1
Median,1
Q3,2
95-th percentile,3
Maximum,4
Range,4
Interquartile range,1

0,1
Standard deviation,0.92668
Coef of variation,0.75424
Kurtosis,-0.54536
Mean,1.2286
MAD,0.76884
Skewness,0.32354
Sum,4240
Variance,0.85873
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
1,1310,38.0%,
2,1006,29.2%,
0,836,24.2%,
3,278,8.1%,
4,21,0.6%,

Value,Count,Frequency (%),Unnamed: 3
0,836,24.2%,
1,1310,38.0%,
2,1006,29.2%,
3,278,8.1%,
4,21,0.6%,

Value,Count,Frequency (%),Unnamed: 3
0,836,24.2%,
1,1310,38.0%,
2,1006,29.2%,
3,278,8.1%,
4,21,0.6%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,2.4857
Minimum,0
Maximum,4
Zeros (%),1.0%

0,1
Minimum,0
5-th percentile,1
Q1,2
Median,2
Q3,3
95-th percentile,4
Maximum,4
Range,4
Interquartile range,1

0,1
Standard deviation,0.88138
Coef of variation,0.35458
Kurtosis,-0.33914
Mean,2.4857
MAD,0.75356
Skewness,-0.10253
Sum,8578
Variance,0.77682
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
2,1346,39.0%,
3,1262,36.6%,
4,430,12.5%,
1,380,11.0%,
0,33,1.0%,

Value,Count,Frequency (%),Unnamed: 3
0,33,1.0%,
1,380,11.0%,
2,1346,39.0%,
3,1262,36.6%,
4,430,12.5%,

Value,Count,Frequency (%),Unnamed: 3
0,33,1.0%,
1,380,11.0%,
2,1346,39.0%,
3,1262,36.6%,
4,430,12.5%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1.3544
Minimum,0
Maximum,4
Zeros (%),40.1%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,1
Q3,2
95-th percentile,3
Maximum,4
Range,4
Interquartile range,2

0,1
Standard deviation,1.2729
Coef of variation,0.9398
Kurtosis,-1.2587
Mean,1.3544
MAD,1.1574
Skewness,0.28165
Sum,4674
Variance,1.6202
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,1383,40.1%,
2,959,27.8%,
3,630,18.3%,
1,350,10.1%,
4,129,3.7%,

Value,Count,Frequency (%),Unnamed: 3
0,1383,40.1%,
1,350,10.1%,
2,959,27.8%,
3,630,18.3%,
4,129,3.7%,

Value,Count,Frequency (%),Unnamed: 3
0,1383,40.1%,
1,350,10.1%,
2,959,27.8%,
3,630,18.3%,
4,129,3.7%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1.6132
Minimum,0
Maximum,4
Zeros (%),9.2%

0,1
Minimum,0
5-th percentile,0
Q1,1
Median,2
Q3,2
95-th percentile,3
Maximum,4
Range,4
Interquartile range,1

0,1
Standard deviation,0.93383
Coef of variation,0.57889
Kurtosis,-0.087631
Mean,1.6132
MAD,0.78225
Skewness,0.40327
Sum,5567
Variance,0.87205
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
1,1370,39.7%,
2,1210,35.1%,
3,443,12.8%,
0,316,9.2%,
4,112,3.2%,

Value,Count,Frequency (%),Unnamed: 3
0,316,9.2%,
1,1370,39.7%,
2,1210,35.1%,
3,443,12.8%,
4,112,3.2%,

Value,Count,Frequency (%),Unnamed: 3
0,316,9.2%,
1,1370,39.7%,
2,1210,35.1%,
3,443,12.8%,
4,112,3.2%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.028398
Minimum,0
Maximum,4
Zeros (%),97.7%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,0
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.20375
Coef of variation,7.1747
Kurtosis,105.36
Mean,0.028398
MAD,0.055495
Skewness,9.1116
Sum,98
Variance,0.041512
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,3372,97.7%,
1,64,1.9%,
2,12,0.3%,
3,2,0.1%,
4,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0,3372,97.7%,
1,64,1.9%,
2,12,0.3%,
3,2,0.1%,
4,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0,3372,97.7%,
1,64,1.9%,
2,12,0.3%,
3,2,0.1%,
4,1,0.0%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.14836
Minimum,0
Maximum,4
Zeros (%),92.4%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,1
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.58929
Coef of variation,3.9719
Kurtosis,21.312
Mean,0.14836
MAD,0.27411
Skewness,4.5374
Sum,512
Variance,0.34726
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,3188,92.4%,
1,120,3.5%,
2,63,1.8%,
3,54,1.6%,
4,26,0.8%,

Value,Count,Frequency (%),Unnamed: 3
0,3188,92.4%,
1,120,3.5%,
2,63,1.8%,
3,54,1.6%,
4,26,0.8%,

Value,Count,Frequency (%),Unnamed: 3
0,3188,92.4%,
1,120,3.5%,
2,63,1.8%,
3,54,1.6%,
4,26,0.8%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.14691
Minimum,0
Maximum,4
Zeros (%),91.7%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,1
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.55129
Coef of variation,3.7524
Kurtosis,20.035
Mean,0.14691
MAD,0.26956
Skewness,4.3274
Sum,507
Variance,0.30392
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,3166,91.7%,
1,132,3.8%,
2,101,2.9%,
3,35,1.0%,
4,17,0.5%,

Value,Count,Frequency (%),Unnamed: 3
0,3166,91.7%,
1,132,3.8%,
2,101,2.9%,
3,35,1.0%,
4,17,0.5%,

Value,Count,Frequency (%),Unnamed: 3
0,3166,91.7%,
1,132,3.8%,
2,101,2.9%,
3,35,1.0%,
4,17,0.5%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.16314
Minimum,0
Maximum,4
Zeros (%),92.2%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,2
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.61081
Coef of variation,3.7441
Kurtosis,15.75
Mean,0.16314
MAD,0.30094
Skewness,3.9886
Sum,563
Variance,0.37309
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,3183,92.2%,
2,114,3.3%,
1,71,2.1%,
3,68,2.0%,
4,15,0.4%,

Value,Count,Frequency (%),Unnamed: 3
0,3183,92.2%,
1,71,2.1%,
2,114,3.3%,
3,68,2.0%,
4,15,0.4%,

Value,Count,Frequency (%),Unnamed: 3
0,3183,92.2%,
1,71,2.1%,
2,114,3.3%,
3,68,2.0%,
4,15,0.4%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.037091
Minimum,0
Maximum,4
Zeros (%),98.4%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,0
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.32449
Coef of variation,8.7484
Kurtosis,101.38
Mean,0.037091
MAD,0.072999
Skewness,9.808
Sum,128
Variance,0.10529
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,3396,98.4%,
1,18,0.5%,
3,14,0.4%,
2,12,0.3%,
4,11,0.3%,

Value,Count,Frequency (%),Unnamed: 3
0,3396,98.4%,
1,18,0.5%,
2,12,0.3%,
3,14,0.4%,
4,11,0.3%,

Value,Count,Frequency (%),Unnamed: 3
0,3396,98.4%,
1,18,0.5%,
2,12,0.3%,
3,14,0.4%,
4,11,0.3%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.34309
Minimum,0
Maximum,4
Zeros (%),78.2%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,2
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.75944
Coef of variation,2.2135
Kurtosis,6.2742
Mean,0.34309
MAD,0.53626
Skewness,2.5298
Sum,1184
Variance,0.57675
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,2697,78.2%,
1,478,13.9%,
2,144,4.2%,
3,110,3.2%,
4,22,0.6%,

Value,Count,Frequency (%),Unnamed: 3
0,2697,78.2%,
1,478,13.9%,
2,144,4.2%,
3,110,3.2%,
4,22,0.6%,

Value,Count,Frequency (%),Unnamed: 3
0,2697,78.2%,
1,478,13.9%,
2,144,4.2%,
3,110,3.2%,
4,22,0.6%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.5778
Minimum,0
Maximum,4
Zeros (%),66.4%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,1
95-th percentile,3
Maximum,4
Range,4
Interquartile range,1

0,1
Standard deviation,0.95399
Coef of variation,1.6511
Kurtosis,1.8022
Mean,0.5778
MAD,0.76717
Skewness,1.636
Sum,1994
Variance,0.9101
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,2291,66.4%,
1,603,17.5%,
2,318,9.2%,
3,201,5.8%,
4,38,1.1%,

Value,Count,Frequency (%),Unnamed: 3
0,2291,66.4%,
1,603,17.5%,
2,318,9.2%,
3,201,5.8%,
4,38,1.1%,

Value,Count,Frequency (%),Unnamed: 3
0,2291,66.4%,
1,603,17.5%,
2,318,9.2%,
3,201,5.8%,
4,38,1.1%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.099971
Minimum,0
Maximum,4
Zeros (%),93.6%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,1
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.43888
Coef of variation,4.39
Kurtosis,33.454
Mean,0.099971
MAD,0.18714
Skewness,5.4286
Sum,345
Variance,0.19261
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,3230,93.6%,
1,140,4.1%,
2,48,1.4%,
3,23,0.7%,
4,10,0.3%,

Value,Count,Frequency (%),Unnamed: 3
0,3230,93.6%,
1,140,4.1%,
2,48,1.4%,
3,23,0.7%,
4,10,0.3%,

Value,Count,Frequency (%),Unnamed: 3
0,3230,93.6%,
1,140,4.1%,
2,48,1.4%,
3,23,0.7%,
4,10,0.3%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.24225
Minimum,0
Maximum,4
Zeros (%),85.9%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,2
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.68004
Coef of variation,2.8072
Kurtosis,10.103
Mean,0.24225
MAD,0.41627
Skewness,3.1589
Sum,836
Variance,0.46246
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,2965,85.9%,
1,246,7.1%,
2,151,4.4%,
3,68,2.0%,
4,21,0.6%,

Value,Count,Frequency (%),Unnamed: 3
0,2965,85.9%,
1,246,7.1%,
2,151,4.4%,
3,68,2.0%,
4,21,0.6%,

Value,Count,Frequency (%),Unnamed: 3
0,2965,85.9%,
1,246,7.1%,
2,151,4.4%,
3,68,2.0%,
4,21,0.6%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.60417
Minimum,0
Maximum,4
Zeros (%),58.6%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,1
95-th percentile,2
Maximum,4
Range,4
Interquartile range,1

0,1
Standard deviation,0.85623
Coef of variation,1.4172
Kurtosis,1.7149
Mean,0.60417
MAD,0.70834
Skewness,1.457
Sum,2085
Variance,0.73313
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,2023,58.6%,
1,944,27.4%,
2,333,9.6%,
3,129,3.7%,
4,22,0.6%,

Value,Count,Frequency (%),Unnamed: 3
0,2023,58.6%,
1,944,27.4%,
2,333,9.6%,
3,129,3.7%,
4,22,0.6%,

Value,Count,Frequency (%),Unnamed: 3
0,2023,58.6%,
1,944,27.4%,
2,333,9.6%,
3,129,3.7%,
4,22,0.6%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.25616
Minimum,0
Maximum,4
Zeros (%),83.2%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,2
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.64416
Coef of variation,2.5147
Kurtosis,8.1975
Mean,0.25616
MAD,0.42621
Skewness,2.8275
Sum,884
Variance,0.41494
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,2871,83.2%,
1,349,10.1%,
2,168,4.9%,
3,53,1.5%,
4,10,0.3%,

Value,Count,Frequency (%),Unnamed: 3
0,2871,83.2%,
1,349,10.1%,
2,168,4.9%,
3,53,1.5%,
4,10,0.3%,

Value,Count,Frequency (%),Unnamed: 3
0,2871,83.2%,
1,349,10.1%,
2,168,4.9%,
3,53,1.5%,
4,10,0.3%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1.5459
Minimum,0
Maximum,4
Zeros (%),39.6%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,2
Q3,3
95-th percentile,4
Maximum,4
Range,4
Interquartile range,3

0,1
Standard deviation,1.3927
Coef of variation,0.90087
Kurtosis,-1.4447
Mean,1.5459
MAD,1.2716
Skewness,0.11717
Sum,5335
Variance,1.9396
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,1366,39.6%,
2,854,24.7%,
3,844,24.5%,
4,236,6.8%,
1,151,4.4%,

Value,Count,Frequency (%),Unnamed: 3
0,1366,39.6%,
1,151,4.4%,
2,854,24.7%,
3,844,24.5%,
4,236,6.8%,

Value,Count,Frequency (%),Unnamed: 3
0,1366,39.6%,
1,151,4.4%,
2,854,24.7%,
3,844,24.5%,
4,236,6.8%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.020574
Minimum,0
Maximum,4
Zeros (%),98.8%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,0
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.21233
Coef of variation,10.32
Kurtosis,185.84
Mean,0.020574
MAD,0.040647
Skewness,12.766
Sum,71
Variance,0.045084
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,3409,98.8%,
1,24,0.7%,
2,10,0.3%,
3,5,0.1%,
4,3,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0,3409,98.8%,
1,24,0.7%,
2,10,0.3%,
3,5,0.1%,
4,3,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0,3409,98.8%,
1,24,0.7%,
2,10,0.3%,
3,5,0.1%,
4,3,0.1%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.32425
Minimum,0
Maximum,4
Zeros (%),82.3%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,2
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.8022
Coef of variation,2.474
Kurtosis,6.8409
Mean,0.32425
MAD,0.53369
Skewness,2.6998
Sum,1119
Variance,0.64352
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,2840,82.3%,
1,289,8.4%,
2,174,5.0%,
3,110,3.2%,
4,38,1.1%,

Value,Count,Frequency (%),Unnamed: 3
0,2840,82.3%,
1,289,8.4%,
2,174,5.0%,
3,110,3.2%,
4,38,1.1%,

Value,Count,Frequency (%),Unnamed: 3
0,2840,82.3%,
1,289,8.4%,
2,174,5.0%,
3,110,3.2%,
4,38,1.1%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1.5868
Minimum,0
Maximum,4
Zeros (%),8.4%

0,1
Minimum,0
5-th percentile,0
Q1,1
Median,2
Q3,2
95-th percentile,3
Maximum,4
Range,4
Interquartile range,1

0,1
Standard deviation,0.87555
Coef of variation,0.55178
Kurtosis,0.12664
Mean,1.5868
MAD,0.73462
Skewness,0.37162
Sum,5476
Variance,0.7666
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
1,1376,39.9%,
2,1339,38.8%,
3,362,10.5%,
0,290,8.4%,
4,84,2.4%,

Value,Count,Frequency (%),Unnamed: 3
0,290,8.4%,
1,1376,39.9%,
2,1339,38.8%,
3,362,10.5%,
4,84,2.4%,

Value,Count,Frequency (%),Unnamed: 3
0,290,8.4%,
1,1376,39.9%,
2,1339,38.8%,
3,362,10.5%,
4,84,2.4%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1.6445
Minimum,0
Maximum,4
Zeros (%),1.0%

0,1
Minimum,0
5-th percentile,1
Q1,1
Median,1
Q3,2
95-th percentile,3
Maximum,4
Range,4
Interquartile range,1

0,1
Standard deviation,0.82158
Coef of variation,0.49961
Kurtosis,0.27744
Mean,1.6445
MAD,0.7019
Skewness,0.94557
Sum,5675
Variance,0.675
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
1,1790,51.9%,
2,1094,31.7%,
3,431,12.5%,
4,101,2.9%,
0,35,1.0%,

Value,Count,Frequency (%),Unnamed: 3
0,35,1.0%,
1,1790,51.9%,
2,1094,31.7%,
3,431,12.5%,
4,101,2.9%,

Value,Count,Frequency (%),Unnamed: 3
0,35,1.0%,
1,1790,51.9%,
2,1094,31.7%,
3,431,12.5%,
4,101,2.9%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.39003
Minimum,0
Maximum,4
Zeros (%),71.1%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,1
95-th percentile,2
Maximum,4
Range,4
Interquartile range,1

0,1
Standard deviation,0.70547
Coef of variation,1.8087
Kurtosis,4.7688
Mean,0.39003
MAD,0.5547
Skewness,2.0784
Sum,1346
Variance,0.49769
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,2454,71.1%,
1,730,21.2%,
2,202,5.9%,
3,48,1.4%,
4,17,0.5%,

Value,Count,Frequency (%),Unnamed: 3
0,2454,71.1%,
1,730,21.2%,
2,202,5.9%,
3,48,1.4%,
4,17,0.5%,

Value,Count,Frequency (%),Unnamed: 3
0,2454,71.1%,
1,730,21.2%,
2,202,5.9%,
3,48,1.4%,
4,17,0.5%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.056216
Minimum,0
Maximum,4
Zeros (%),96.4%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,0
Maximum,4
Range,4
Interquartile range,0

0,1
Standard deviation,0.33669
Coef of variation,5.9893
Kurtosis,66.189
Mean,0.056216
MAD,0.10839
Skewness,7.5792
Sum,194
Variance,0.11336
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0,3327,96.4%,
1,81,2.3%,
2,23,0.7%,
3,13,0.4%,
4,7,0.2%,

Value,Count,Frequency (%),Unnamed: 3
0,3327,96.4%,
1,81,2.3%,
2,23,0.7%,
3,13,0.4%,
4,7,0.2%,

Value,Count,Frequency (%),Unnamed: 3
0,3327,96.4%,
1,81,2.3%,
2,23,0.7%,
3,13,0.4%,
4,7,0.2%,

0,1
Distinct count,5
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1.1214
Minimum,0
Maximum,4
Zeros (%),31.0%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,1
Q3,2
95-th percentile,3
Maximum,4
Range,4
Interquartile range,2

0,1
Standard deviation,0.99828
Coef of variation,0.8902
Kurtosis,-0.091094
Mean,1.1214
MAD,0.78675
Skewness,0.68057
Sum,3870
Variance,0.99656
Memory size,27.1 KiB

Value,Count,Frequency (%),Unnamed: 3
1,1289,37.4%,
0,1071,31.0%,
2,757,21.9%,
3,269,7.8%,
4,65,1.9%,

Value,Count,Frequency (%),Unnamed: 3
0,1071,31.0%,
1,1289,37.4%,
2,757,21.9%,
3,269,7.8%,
4,65,1.9%,

Value,Count,Frequency (%),Unnamed: 3
0,1071,31.0%,
1,1289,37.4%,
2,757,21.9%,
3,269,7.8%,
4,65,1.9%,

Unnamed: 0,id,rating,category,tasting_note,woody,sweet,spicy,fruity,harsh,tart,rich,vanilla,herbal,chemical,umami,hogo,juniper,neutral,mineral,earthy,nutty,roast,salty,bitter,full_bodied,grain,peaty,oily,floral,briny,rancio,smoky
0,0,99,Brandy,"A stellar bottle of brandy. Classic cognac flavors of French vanilla, dried violets, and exotic marmalade are joined by rich toffee and spice. Perhaps most importantly, there is also a deep, savory rancio aspect -- the French term to describe a noble oxidation present after long exposure to air and casks. Unlike many other cognacs that are this age on the market, the fruit is still solidly intact and the oak adds spice and complexity, not tannin and bitterness. World classic cognac for lovers of grace and beauty, not necessarily heft and power.",2,3,1,4,0,1,2,0,1,0,0,0,0,0,0,1,3,1,0,0,0,0,0,1,2,0,4,1
1,1,99,Brandy,"The best Calvados retain an apple fruit quality in a way that the best Armagnac and Cognac do not reflect with grape. The aromatics here soar with a pure orchard fruit that shifts back and forth from luscious, candied, apple preserves and more savory autumn flavors of wood smoke. The 53% alcohol never betrays itself and the spirit is surprisingly drinkable for its strength and concentration. In a similar trick, the 18 years in wood have left only the slightest hint of oak tannin and seems to have focused and enhanced the fruit instead of obscuring it with vanilla. Highest recommendation, best in class.",1,4,1,4,0,1,3,0,1,0,0,0,0,0,0,1,2,1,0,0,0,0,0,3,1,0,1,1
2,2,99,Whiskey,"Tasting this whisky was one of those moments where your surroundings come to a halt and all of your senses are heightened. There is a beautiful marriage of grain and fruit expressed in this whisky. The sherry casks are quite evident with stone fruit and cherry mixed with warm baking spices and a light floral incense. The malt, however, is standing firm and not being over-powered by the fruit. There is a gentle wisp of smoke with the finish and it acts much like adding salt and pepper to your dish. Kudos to their master blender for a harmonious and elegant whisky.",0,4,2,4,0,1,4,1,2,0,0,0,0,0,0,0,0,0,1,0,4,0,4,1,2,0,0,2
3,3,99,Whiskey,"The sweet smoke is the underlying feature in this whisky but the complexity of the dram is what is most enjoyable. Among the many notes found were oyster mushrooms, fresh cut apples, kelp, cigar ash, honey, sea salt, and smoked bacon. Velvety and indulgent, the whisky finishes on the dry side with mouthwatering acidity.",0,3,2,3,0,2,4,2,1,0,0,0,0,0,0,0,0,0,2,0,3,0,2,2,1,1,0,2
4,4,99,Gin,"Monkey 47 is an exquisite gin that pushes the boundaries of how much and what type of flavor a gin can have. The 47 ingredients build off of each other rather than contradict and the unlikely combination of forest fruit and exotic tones of wildflowers and island spices (especially on the balanced and long, rich finish) create a heady beverage that reveals more upon every sip. Juniper is present, but there is so many other flavors present that it is not nearly as dominant as in many more traditional gins. This is truly one of the world’s most complex gins and although we're sure that it would make wonderful cocktails, one should try it by its self to appreciate the full spectrum of flavors.",0,2,4,4,0,0,3,0,4,0,0,0,1,0,1,1,0,0,0,0,0,0,0,2,4,0,0,0
