In [1]:
%load_ext autoreload
%autoreload 2

In [2]:
import numpy as np
from scipy import stats
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
from IPython.display import display, HTML, Markdown, Latex, Image

from sklearn.model_selection import train_test_split

import markdown2
import tabulate

In [3]:
import pandas_explore as exp

In [4]:
# Titanic data
# 'Survived' and 'Pclass' are cast to object dtype right after loading.
# NOTE(review): presumably so the render helpers treat them as categorical — confirm.
df_titanic = pd.read_csv('./data/titanic.csv').astype({'Survived':'object', 'Pclass':'object'})
# Fixed random_state: without it the split (and every output derived from it)
# changes on each Restart & Run All.
df_titanic_train, df_titanic_test = train_test_split(df_titanic, test_size=0.2, random_state=42)
# Remove the 'Survived' column from the test split.
df_titanic_test = df_titanic_test.drop(columns=['Survived'])

In [5]:
# Diamonds data
df_diamonds = pd.read_csv('./data/diamonds.csv')
# 80/20 train/test split. random_state is pinned so the statistics rendered from
# these frames are reproducible on a fresh kernel.
df_dia_train, df_dia_test = train_test_split(df_diamonds, test_size=0.2, random_state=42)

In [8]:
# stock
# Load the stock CSV and convert its 'Date' column to datetimes.
# `infer_datetime_format=True` was removed from the call: it is deprecated since
# pandas 2.0 (format inference is the default behavior) and only raises a warning.
df_stock = pd.read_csv('./data/stock.csv').assign(Date = lambda df: pd.to_datetime(df['Date']))

# Render Concept

1. Plot Render 함수
    - render_cat2cat
    - render_cat2num
    - render_num2cat
    - render_num2num


2. 단일 변수/데이터셋 Render 함수
    - render_variable
    - render_variables_info
    - render_dataset_info


3. 모델 유형별 Target 변수 변화량 Render 함수
    - render_target_by_feature_clf
    - render_target_by_feature_reg


4. 기타 도움 함수
    - render_cols_table
    - render_dict2table
    - render_list2table

## 1. Plot Render 함수

### 1.1 render_cat2cat

In [36]:
# Print the docstring of exp.render_cat2cat (arguments and a usage example).
print(exp.render_cat2cat.__doc__)


    plot_cat2cat의 상위 함수로 normalized 여부에 따른 2개의 plot을 함께 보여준다.

    Arguments:
        df (Data Frame)
        cat_col (str)
        target_col (str)

    Returns:
        HTML 형식으로 노트북 화면에 표출한다.

    Example:
        >>> render_cat2cat(df_titanic_train, 'Pclass', 'Survived')
    


In [6]:
# Render 'Survived' by 'Pclass' on the Titanic training split; per the docstring
# this shows two plots together (class counts and normalized counts).
exp.render_cat2cat(df_titanic_train, 'Pclass', 'Survived')

0,1
"""Survived"" by ""Pclass""","""Survived"" by ""Pclass"""
Class Counts,Normalized Counts
,


### 1.2 render_cat2num

In [37]:
# Print the docstring of exp.render_cat2num (arguments and a usage example).
print(exp.render_cat2num.__doc__)


    plot_cat2num, plot_cat2pie의 상위 함수로 범주형 변수에 따른 수치 변수의 변화를 보여준다.

    Arguments:
        df (Data Frame)
        cat_col (str)
        target_col (str)

    Example:
        >>> render_cat2num(df_stock, cat_col='Weekday', target_col='Close')
    


In [38]:
# Render how the numeric 'Age' column is distributed across the categorical
# 'Pclass' column, using the full (unsplit) Titanic frame.
exp.render_cat2num(df_titanic, cat_col='Pclass', target_col='Age')

0,1
"""Age"" Distribution by ""Pclass""","""Age"" Distribution by ""Pclass"""
,


### 1.3 render_num2cat

In [39]:
# Print the docstring of exp.render_num2cat (arguments and a usage example).
print(exp.render_num2cat.__doc__)


    plot_num2cat의 상위 함수로 multiple 옵션에 따른 2개의 plot을 함께 보여준다.

    Arguments:
        df (Data Frame)
        num_col (str)
        target_col (str)

    Example:
        >>> render_num2cat(df_titanic_train, 'Age', 'Survived')
    


In [7]:
# Render 'Survived' by the numeric 'Age' column on the Titanic training split;
# per the docstring this shows two plots together (one per `multiple` option).
exp.render_num2cat(df_titanic_train, 'Age', 'Survived')

0,1
"""Survived"" by ""Age""","""Survived"" by ""Age"""
Class Distribution,Normalized Distribution
,


### 1.4 render_num2num

In [40]:
# Print the docstring of exp.render_num2num (usage example only).
print(exp.render_num2num.__doc__)


    plot_num2num, plot_num2histd의 상위 함수이다.

    Example:
        >>> render_num2num(df_stock, num_col='Open', target_col='Close')
    


In [30]:
# Render the 'price' distribution by 'carat' using the full (unsplit) Diamonds frame.
exp.render_num2num(df_diamonds, num_col='carat', target_col='price')

0,1,2
"""price"" Distribution by ""carat""","""price"" Distribution by ""carat""","""price"" Distribution by ""carat"""
,,


## 2. Dataset/Variable Render 함수

### 2.1 render_dataset_info

In [73]:
# Inspect the summary information of a single dataset (Diamonds train split only).
# 'set_name' is the title of the set; 'dfs' is a list of {'df_name', 'df'} entries.
exp.render_dataset_info({
    'set_name': 'Diamonds', 
    'dfs': [{'df_name': 'Train', 'df': df_dia_train}], 
})

## Diamonds Datasets

0,1
Train statisticsNumber of variables10Number of observations43152Missing cells0Missing cells(%)0.0Duplicated rows91Duplicated rows(%)0.21,variable typesNumeric7Object3Category0Datetime0Timedeltas0

0,1
Train statistics,Train statistics
Number of variables,10
Number of observations,43152
Missing cells,0
Missing cells(%),0.0
Duplicated rows,91
Duplicated rows(%),0.21

0,1
variable types,variable types
Numeric,7
Object,3
Category,0
Datetime,0
Timedeltas,0


In [69]:
# Inspect the summary information of several datasets at once
# (Diamonds train and test splits passed together in 'dfs').
exp.render_dataset_info({
    'set_name': 'Diamonds', 
    'dfs': [{'df_name': 'Train', 'df': df_dia_train}, {'df_name': 'Test', 'df': df_dia_test}], 
})

## Diamonds Datasets

0,1,2,3
Train statisticsNumber of variables10Number of observations43152Missing cells0Missing cells(%)0.0Duplicated rows91Duplicated rows(%)0.21,variable typesNumeric7Object3Category0Datetime0Timedeltas0,Test statisticsNumber of variables10Number of observations10788Missing cells0Missing cells(%)0.0Duplicated rows8Duplicated rows(%)0.074,variable typesNumeric7Object3Category0Datetime0Timedeltas0

0,1
Train statistics,Train statistics
Number of variables,10
Number of observations,43152
Missing cells,0
Missing cells(%),0.0
Duplicated rows,91
Duplicated rows(%),0.21

0,1
variable types,variable types
Numeric,7
Object,3
Category,0
Datetime,0
Timedeltas,0

0,1
Test statistics,Test statistics
Number of variables,10
Number of observations,10788
Missing cells,0
Missing cells(%),0.0
Duplicated rows,8
Duplicated rows(%),0.074

0,1
variable types,variable types
Numeric,7
Object,3
Category,0
Datetime,0
Timedeltas,0


### 2.2 render_variable

In [45]:
# Render the information of a single variable ('Age' in the full Titanic frame).
exp.render_variable(df_titanic, 'Age')

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size891distinct89distinct(%)9.99missing177missing(%)19.86minimum0.42maximum80.0,zeros0zeros(%)0.00mean29.70median28.00sum21205.17sd14.53skewness0.39,minimun0.425-th per.4.00Q120.12median28.0Q338.0095-th per.56.00maximum80.0,valuecountratio(%)24.0304.2022.0273.7018.0263.6019.0253.5030.0253.5028.0253.50,valuecountratio(%)0.4210.100.6710.100.7520.200.8320.200.9210.101.070.90,valuecountratio(%)66.010.1070.020.2070.510.1071.020.2074.010.1080.010.10,

0,1
size,891.0
distinct,89.0
distinct(%),9.99
missing,177.0
missing(%),19.86
minimum,0.42
maximum,80.0

0,1
zeros,0.0
zeros(%),0.0
mean,29.7
median,28.0
sum,21205.17
sd,14.53
skewness,0.39

0,1
minimun,0.42
5-th per.,4.0
Q1,20.12
median,28.0
Q3,38.0
95-th per.,56.0
maximum,80.0

0,1,2
value,count,ratio(%)
24.0,30,4.20
22.0,27,3.70
18.0,26,3.60
19.0,25,3.50
30.0,25,3.50
28.0,25,3.50

0,1,2
value,count,ratio(%)
0.42,1,0.10
0.67,1,0.10
0.75,2,0.20
0.83,2,0.20
0.92,1,0.10
1.0,7,0.90

0,1,2
value,count,ratio(%)
66.0,1,0.10
70.0,2,0.20
70.5,1,0.10
71.0,2,0.20
74.0,1,0.10
80.0,1,0.10


### 2.3 render_variables_info

In [78]:
# Render the per-variable information of a single dataset (Diamonds train split only).
exp.render_variables_info({
    'set_name': 'Diamonds', 
    'dfs': [{'df_name': 'Train', 'df': df_dia_train}], 
})

## Diamonds Variables

### 1. "carat"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct269distinct(%)0.62missing0missing(%)0.00minimum0.2maximum5.01,zeros0zeros(%)0.00mean0.80median0.70sum34356.38sd0.47skewness1.13,minimun0.25-th per.0.30Q10.40median0.7Q31.0495-th per.1.70maximum5.01,valuecountratio(%)0.320694.701.0118144.200.3118014.100.715863.600.3214863.401.012292.80,valuecountratio(%)0.290.000.2170.000.2250.000.232470.500.242170.500.251690.30,valuecountratio(%)3.6710.004.010.004.0120.004.1310.004.510.005.0110.00,

0,1
size,43152.0
distinct,269.0
distinct(%),0.62
missing,0.0
missing(%),0.0
minimum,0.2
maximum,5.01

0,1
zeros,0.0
zeros(%),0.0
mean,0.8
median,0.7
sum,34356.38
sd,0.47
skewness,1.13

0,1
minimun,0.2
5-th per.,0.3
Q1,0.4
median,0.7
Q3,1.04
95-th per.,1.7
maximum,5.01

0,1,2
value,count,ratio(%)
0.3,2069,4.70
1.01,1814,4.20
0.31,1801,4.10
0.7,1586,3.60
0.32,1486,3.40
1.0,1229,2.80

0,1,2
value,count,ratio(%)
0.2,9,0.00
0.21,7,0.00
0.22,5,0.00
0.23,247,0.50
0.24,217,0.50
0.25,169,0.30

0,1,2
value,count,ratio(%)
3.67,1,0.00
4.0,1,0.00
4.01,2,0.00
4.13,1,0.00
4.5,1,0.00
5.01,1,0.00


----------

### 2. "cut"

0,1,2,3
| Descriptive Statistics |,| Common Values |,| Bar Chart |,| Pie Chart |
size43152distinct5distinct(%)0.011missing0missing(%)0.0,valuecountratio(%)Ideal1724339.90Premium1106025.60Very Good963722.30Good39029.00Fair13103.00,,

0,1
size,43152.0
distinct,5.0
distinct(%),0.011
missing,0.0
missing(%),0.0

0,1,2
value,count,ratio(%)
Ideal,17243,39.90
Premium,11060,25.60
Very Good,9637,22.30
Good,3902,9.00
Fair,1310,3.00


----------

### 3. "color"

0,1,2,3
| Descriptive Statistics |,| Common Values |,| Bar Chart |,| Pie Chart |
size43152distinct7distinct(%)0.016missing0missing(%)0.0,valuecountratio(%)G903420.90E784418.10F762217.60H660815.30D544912.60I435610.00,,

0,1
size,43152.0
distinct,7.0
distinct(%),0.016
missing,0.0
missing(%),0.0

0,1,2
value,count,ratio(%)
G,9034,20.90
E,7844,18.10
F,7622,17.60
H,6608,15.30
D,5449,12.60
I,4356,10.00


----------

### 4. "clarity"

0,1,2,3
| Descriptive Statistics |,| Common Values |,| Bar Chart |,| Pie Chart |
size43152distinct8distinct(%)0.018missing0missing(%)0.0,valuecountratio(%)SI11046024.20VS2978122.60SI2733316.90VS1661215.30VVS240159.30VVS129226.70,,

0,1
size,43152.0
distinct,8.0
distinct(%),0.018
missing,0.0
missing(%),0.0

0,1,2
value,count,ratio(%)
SI1,10460,24.20
VS2,9781,22.60
SI2,7333,16.90
VS1,6612,15.30
VVS2,4015,9.30
VVS1,2922,6.70


----------

### 5. "depth"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct177distinct(%)0.41missing0missing(%)0.00minimum43.0maximum79.0,zeros0zeros(%)0.00mean61.75median61.80sum2664578.90sd1.44skewness-0.04,minimun43.05-th per.59.30Q161.00median61.8Q362.5095-th per.63.80maximum79.0,valuecountratio(%)62.017884.1061.917374.0061.816623.8062.216403.8062.116273.7062.315663.60,valuecountratio(%)43.020.0050.810.0051.010.0052.210.0052.710.0053.210.00,valuecountratio(%)71.810.0072.210.0072.910.0073.610.0078.210.0079.020.00,

0,1
size,43152.0
distinct,177.0
distinct(%),0.41
missing,0.0
missing(%),0.0
minimum,43.0
maximum,79.0

0,1
zeros,0.0
zeros(%),0.0
mean,61.75
median,61.8
sum,2664578.9
sd,1.44
skewness,-0.04

0,1
minimun,43.0
5-th per.,59.3
Q1,61.0
median,61.8
Q3,62.5
95-th per.,63.8
maximum,79.0

0,1,2
value,count,ratio(%)
62.0,1788,4.10
61.9,1737,4.00
61.8,1662,3.80
62.2,1640,3.80
62.1,1627,3.70
62.3,1566,3.60

0,1,2
value,count,ratio(%)
43.0,2,0.00
50.8,1,0.00
51.0,1,0.00
52.2,1,0.00
52.7,1,0.00
53.2,1,0.00

0,1,2
value,count,ratio(%)
71.8,1,0.00
72.2,1,0.00
72.9,1,0.00
73.6,1,0.00
78.2,1,0.00
79.0,2,0.00


----------

### 6. "table"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct123distinct(%)0.28missing0missing(%)0.00minimum43.0maximum95.0,zeros0zeros(%)0.00mean57.46median57.00sum2479515.80sd2.24skewness0.84,minimun43.05-th per.54.00Q156.00median57.0Q359.0095-th per.61.00maximum95.0,valuecountratio(%)56.0785618.2057.0777718.0058.0673115.5059.0525712.1055.0502311.6060.034187.90,valuecountratio(%)43.010.0044.010.0049.020.0051.070.0051.610.0052.0360.00,valuecountratio(%)70.090.0071.010.0073.040.0076.010.0079.010.0095.010.00,

0,1
size,43152.0
distinct,123.0
distinct(%),0.28
missing,0.0
missing(%),0.0
minimum,43.0
maximum,95.0

0,1
zeros,0.0
zeros(%),0.0
mean,57.46
median,57.0
sum,2479515.8
sd,2.24
skewness,0.84

0,1
minimun,43.0
5-th per.,54.0
Q1,56.0
median,57.0
Q3,59.0
95-th per.,61.0
maximum,95.0

0,1,2
value,count,ratio(%)
56.0,7856,18.20
57.0,7777,18.00
58.0,6731,15.50
59.0,5257,12.10
55.0,5023,11.60
60.0,3418,7.90

0,1,2
value,count,ratio(%)
43.0,1,0.00
44.0,1,0.00
49.0,2,0.00
51.0,7,0.00
51.6,1,0.00
52.0,36,0.00

0,1,2
value,count,ratio(%)
70.0,9,0.00
71.0,1,0.00
73.0,4,0.00
76.0,1,0.00
79.0,1,0.00
95.0,1,0.00


----------

### 7. "price"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct10645distinct(%)24.67missing0missing(%)0.00minimum326maximum18823,zeros0zeros(%)0.00mean3913.03median2394.00sum168855182.00sd3968.66skewness1.62,minimun326.05-th per.544.00Q1949.00median2394.0Q35296.2595-th per.13060.00maximum18823.0,valuecountratio(%)625.01070.20605.01050.20698.01000.20802.0980.20776.0980.20789.0980.20,valuecountratio(%)326.010.00327.010.00335.010.00336.020.00337.020.00338.010.00,valuecountratio(%)18788.010.0018791.010.0018795.010.0018804.010.0018806.010.0018823.010.00,

0,1
size,43152.0
distinct,10645.0
distinct(%),24.67
missing,0.0
missing(%),0.0
minimum,326.0
maximum,18823.0

0,1
zeros,0.0
zeros(%),0.0
mean,3913.03
median,2394.0
sum,168855182.0
sd,3968.66
skewness,1.62

0,1
minimun,326.0
5-th per.,544.0
Q1,949.0
median,2394.0
Q3,5296.25
95-th per.,13060.0
maximum,18823.0

0,1,2
value,count,ratio(%)
625.0,107,0.20
605.0,105,0.20
698.0,100,0.20
802.0,98,0.20
776.0,98,0.20
789.0,98,0.20

0,1,2
value,count,ratio(%)
326.0,1,0.00
327.0,1,0.00
335.0,1,0.00
336.0,2,0.00
337.0,2,0.00
338.0,1,0.00

0,1,2
value,count,ratio(%)
18788.0,1,0.00
18791.0,1,0.00
18795.0,1,0.00
18804.0,1,0.00
18806.0,1,0.00
18823.0,1,0.00


----------

### 8. "x"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct548distinct(%)1.27missing0missing(%)0.00minimum0.0maximum10.74,zeros6zeros(%)0.01mean5.73median5.69sum247128.96sd1.12skewness0.38,minimun0.05-th per.4.29Q14.71median5.69Q36.5395-th per.7.65maximum10.74,valuecountratio(%)4.373500.804.333470.804.343440.704.323360.704.383310.704.353270.70,valuecountratio(%)0.060.003.7320.003.7410.003.7610.003.7710.003.7910.00,valuecountratio(%)10.010.0010.0110.0010.0210.0010.1410.0010.2310.0010.7410.00,

0,1
size,43152.0
distinct,548.0
distinct(%),1.27
missing,0.0
missing(%),0.0
minimum,0.0
maximum,10.74

0,1
zeros,6.0
zeros(%),0.01
mean,5.73
median,5.69
sum,247128.96
sd,1.12
skewness,0.38

0,1
minimun,0.0
5-th per.,4.29
Q1,4.71
median,5.69
Q3,6.53
95-th per.,7.65
maximum,10.74

0,1,2
value,count,ratio(%)
4.37,350,0.80
4.33,347,0.80
4.34,344,0.70
4.32,336,0.70
4.38,331,0.70
4.35,327,0.70

0,1,2
value,count,ratio(%)
0.0,6,0.00
3.73,2,0.00
3.74,1,0.00
3.76,1,0.00
3.77,1,0.00
3.79,1,0.00

0,1,2
value,count,ratio(%)
10.0,1,0.00
10.01,1,0.00
10.02,1,0.00
10.14,1,0.00
10.23,1,0.00
10.74,1,0.00


----------

### 9. "y"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct545distinct(%)1.26missing0missing(%)0.00minimum0.0maximum58.9,zeros5zeros(%)0.01mean5.73median5.71sum247295.30sd1.15skewness2.92,minimun0.05-th per.4.29Q14.72median5.71Q36.5395-th per.7.64maximum58.9,valuecountratio(%)4.343510.804.373450.704.393340.704.333330.704.353310.704.383240.70,valuecountratio(%)0.050.003.6810.003.7120.003.7210.003.7310.003.7510.00,valuecountratio(%)9.9420.0010.110.0010.1610.0010.5410.0031.810.0058.910.00,

0,1
size,43152.0
distinct,545.0
distinct(%),1.26
missing,0.0
missing(%),0.0
minimum,0.0
maximum,58.9

0,1
zeros,5.0
zeros(%),0.01
mean,5.73
median,5.71
sum,247295.3
sd,1.15
skewness,2.92

0,1
minimun,0.0
5-th per.,4.29
Q1,4.72
median,5.71
Q3,6.53
95-th per.,7.64
maximum,58.9

0,1,2
value,count,ratio(%)
4.34,351,0.80
4.37,345,0.70
4.39,334,0.70
4.33,333,0.70
4.35,331,0.70
4.38,324,0.70

0,1,2
value,count,ratio(%)
0.0,5,0.00
3.68,1,0.00
3.71,2,0.00
3.72,1,0.00
3.73,1,0.00
3.75,1,0.00

0,1,2
value,count,ratio(%)
9.94,2,0.00
10.1,1,0.00
10.16,1,0.00
10.54,1,0.00
31.8,1,0.00
58.9,1,0.00


----------

### 10. "z"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct365distinct(%)0.84missing0missing(%)0.00minimum0.0maximum8.06,zeros17zeros(%)0.04mean3.54median3.52sum152565.54sd0.69skewness0.35,minimun0.05-th per.2.65Q12.91median3.52Q34.0395-th per.4.73maximum8.06,valuecountratio(%)2.76251.402.716171.402.696061.402.685911.302.725561.202.675141.10,valuecountratio(%)0.0170.001.0710.001.5310.002.0610.002.2410.002.2710.00,valuecountratio(%)6.3110.006.3810.006.4310.006.7210.006.9810.008.0610.00,

0,1
size,43152.0
distinct,365.0
distinct(%),0.84
missing,0.0
missing(%),0.0
minimum,0.0
maximum,8.06

0,1
zeros,17.0
zeros(%),0.04
mean,3.54
median,3.52
sum,152565.54
sd,0.69
skewness,0.35

0,1
minimun,0.0
5-th per.,2.65
Q1,2.91
median,3.52
Q3,4.03
95-th per.,4.73
maximum,8.06

0,1,2
value,count,ratio(%)
2.7,625,1.40
2.71,617,1.40
2.69,606,1.40
2.68,591,1.30
2.72,556,1.20
2.67,514,1.10

0,1,2
value,count,ratio(%)
0.0,17,0.00
1.07,1,0.00
1.53,1,0.00
2.06,1,0.00
2.24,1,0.00
2.27,1,0.00

0,1,2
value,count,ratio(%)
6.31,1,0.00
6.38,1,0.00
6.43,1,0.00
6.72,1,0.00
6.98,1,0.00
8.06,1,0.00


----------

In [79]:
# Render the per-variable information of the datasets
# (Diamonds train and test splits passed together in 'dfs').
exp.render_variables_info({
    'set_name': 'Diamonds', 
    'dfs': [{'df_name': 'Train', 'df': df_dia_train}, {'df_name': 'Test', 'df': df_dia_test}], 
})

## Diamonds Variables

### 1. "carat"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct269distinct(%)0.62missing0missing(%)0.00minimum0.2maximum5.01,zeros0zeros(%)0.00mean0.80median0.70sum34356.38sd0.47skewness1.13,minimun0.25-th per.0.30Q10.40median0.7Q31.0495-th per.1.70maximum5.01,valuecountratio(%)0.320694.701.0118144.200.3118014.100.715863.600.3214863.401.012292.80,valuecountratio(%)0.290.000.2170.000.2250.000.232470.500.242170.500.251690.30,valuecountratio(%)3.6710.004.010.004.0120.004.1310.004.510.005.0110.00,

0,1
size,43152.0
distinct,269.0
distinct(%),0.62
missing,0.0
missing(%),0.0
minimum,0.2
maximum,5.01

0,1
zeros,0.0
zeros(%),0.0
mean,0.8
median,0.7
sum,34356.38
sd,0.47
skewness,1.13

0,1
minimun,0.2
5-th per.,0.3
Q1,0.4
median,0.7
Q3,1.04
95-th per.,1.7
maximum,5.01

0,1,2
value,count,ratio(%)
0.3,2069,4.70
1.01,1814,4.20
0.31,1801,4.10
0.7,1586,3.60
0.32,1486,3.40
1.0,1229,2.80

0,1,2
value,count,ratio(%)
0.2,9,0.00
0.21,7,0.00
0.22,5,0.00
0.23,247,0.50
0.24,217,0.50
0.25,169,0.30

0,1,2
value,count,ratio(%)
3.67,1,0.00
4.0,1,0.00
4.01,2,0.00
4.13,1,0.00
4.5,1,0.00
5.01,1,0.00


0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size10788distinct234distinct(%)2.17missing0missing(%)0.00minimum0.2maximum3.51,zeros0zeros(%)0.00mean0.81median0.71sum8684.49sd0.48skewness1.05,minimun0.25-th per.0.30Q10.40median0.71Q31.0595-th per.1.71maximum3.51,valuecountratio(%)0.35354.900.314484.101.014283.900.73953.600.323543.201.03293.00,valuecountratio(%)0.230.000.2120.000.23460.400.24370.300.25430.300.26440.40,valuecountratio(%)2.7410.002.7710.003.010.003.0140.003.510.003.5110.00,

0,1
size,10788.0
distinct,234.0
distinct(%),2.17
missing,0.0
missing(%),0.0
minimum,0.2
maximum,3.51

0,1
zeros,0.0
zeros(%),0.0
mean,0.81
median,0.71
sum,8684.49
sd,0.48
skewness,1.05

0,1
minimun,0.2
5-th per.,0.3
Q1,0.4
median,0.71
Q3,1.05
95-th per.,1.71
maximum,3.51

0,1,2
value,count,ratio(%)
0.3,535,4.90
0.31,448,4.10
1.01,428,3.90
0.7,395,3.60
0.32,354,3.20
1.0,329,3.00

0,1,2
value,count,ratio(%)
0.2,3,0.00
0.21,2,0.00
0.23,46,0.40
0.24,37,0.30
0.25,43,0.30
0.26,44,0.40

0,1,2
value,count,ratio(%)
2.74,1,0.00
2.77,1,0.00
3.0,1,0.00
3.01,4,0.00
3.5,1,0.00
3.51,1,0.00


----------

### 2. "cut"

0,1,2,3
| Descriptive Statistics |,| Common Values |,| Bar Chart |,| Pie Chart |
size43152distinct5distinct(%)0.011missing0missing(%)0.0,valuecountratio(%)Ideal1724339.90Premium1106025.60Very Good963722.30Good39029.00Fair13103.00,,

0,1
size,43152.0
distinct,5.0
distinct(%),0.011
missing,0.0
missing(%),0.0

0,1,2
value,count,ratio(%)
Ideal,17243,39.90
Premium,11060,25.60
Very Good,9637,22.30
Good,3902,9.00
Fair,1310,3.00


0,1,2,3
| Descriptive Statistics |,| Common Values |,| Bar Chart |,| Pie Chart |
size10788distinct5distinct(%)0.046missing0missing(%)0.0,valuecountratio(%)Ideal430839.90Premium273125.30Very Good244522.60Good10049.30Fair3002.70,,

0,1
size,10788.0
distinct,5.0
distinct(%),0.046
missing,0.0
missing(%),0.0

0,1,2
value,count,ratio(%)
Ideal,4308,39.90
Premium,2731,25.30
Very Good,2445,22.60
Good,1004,9.30
Fair,300,2.70


----------

### 3. "color"

0,1,2,3
| Descriptive Statistics |,| Common Values |,| Bar Chart |,| Pie Chart |
size43152distinct7distinct(%)0.016missing0missing(%)0.0,valuecountratio(%)G903420.90E784418.10F762217.60H660815.30D544912.60I435610.00,,

0,1
size,43152.0
distinct,7.0
distinct(%),0.016
missing,0.0
missing(%),0.0

0,1,2
value,count,ratio(%)
G,9034,20.90
E,7844,18.10
F,7622,17.60
H,6608,15.30
D,5449,12.60
I,4356,10.00


0,1,2,3
| Descriptive Statistics |,| Common Values |,| Bar Chart |,| Pie Chart |
size10788distinct7distinct(%)0.064missing0missing(%)0.0,valuecountratio(%)G225820.90E195318.10F192017.70H169615.70D132612.20I10669.80,,

0,1
size,10788.0
distinct,7.0
distinct(%),0.064
missing,0.0
missing(%),0.0

0,1,2
value,count,ratio(%)
G,2258,20.90
E,1953,18.10
F,1920,17.70
H,1696,15.70
D,1326,12.20
I,1066,9.80


----------

### 4. "clarity"

0,1,2,3
| Descriptive Statistics |,| Common Values |,| Bar Chart |,| Pie Chart |
size43152distinct8distinct(%)0.018missing0missing(%)0.0,valuecountratio(%)SI11046024.20VS2978122.60SI2733316.90VS1661215.30VVS240159.30VVS129226.70,,

0,1
size,43152.0
distinct,8.0
distinct(%),0.018
missing,0.0
missing(%),0.0

0,1,2
value,count,ratio(%)
SI1,10460,24.20
VS2,9781,22.60
SI2,7333,16.90
VS1,6612,15.30
VVS2,4015,9.30
VVS1,2922,6.70


0,1,2,3
| Descriptive Statistics |,| Common Values |,| Bar Chart |,| Pie Chart |
size10788distinct8distinct(%)0.074missing0missing(%)0.0,valuecountratio(%)SI1260524.10VS2247722.90SI2186117.20VS1155914.40VVS210519.70VVS17336.70,,

0,1
size,10788.0
distinct,8.0
distinct(%),0.074
missing,0.0
missing(%),0.0

0,1,2
value,count,ratio(%)
SI1,2605,24.10
VS2,2477,22.90
SI2,1861,17.20
VS1,1559,14.40
VVS2,1051,9.70
VVS1,733,6.70


----------

### 5. "depth"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct177distinct(%)0.41missing0missing(%)0.00minimum43.0maximum79.0,zeros0zeros(%)0.00mean61.75median61.80sum2664578.90sd1.44skewness-0.04,minimun43.05-th per.59.30Q161.00median61.8Q362.5095-th per.63.80maximum79.0,valuecountratio(%)62.017884.1061.917374.0061.816623.8062.216403.8062.116273.7062.315663.60,valuecountratio(%)43.020.0050.810.0051.010.0052.210.0052.710.0053.210.00,valuecountratio(%)71.810.0072.210.0072.910.0073.610.0078.210.0079.020.00,

0,1
size,43152.0
distinct,177.0
distinct(%),0.41
missing,0.0
missing(%),0.0
minimum,43.0
maximum,79.0

0,1
zeros,0.0
zeros(%),0.0
mean,61.75
median,61.8
sum,2664578.9
sd,1.44
skewness,-0.04

0,1
minimun,43.0
5-th per.,59.3
Q1,61.0
median,61.8
Q3,62.5
95-th per.,63.8
maximum,79.0

0,1,2
value,count,ratio(%)
62.0,1788,4.10
61.9,1737,4.00
61.8,1662,3.80
62.2,1640,3.80
62.1,1627,3.70
62.3,1566,3.60

0,1,2
value,count,ratio(%)
43.0,2,0.00
50.8,1,0.00
51.0,1,0.00
52.2,1,0.00
52.7,1,0.00
53.2,1,0.00

0,1,2
value,count,ratio(%)
71.8,1,0.00
72.2,1,0.00
72.9,1,0.00
73.6,1,0.00
78.2,1,0.00
79.0,2,0.00


0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size10788distinct138distinct(%)1.28missing0missing(%)0.00minimum44.0maximum71.6,zeros0zeros(%)0.00mean61.75median61.80sum666184.00sd1.41skewness-0.26,minimun44.05-th per.59.40Q161.00median61.8Q362.5095-th per.63.80maximum71.6,valuecountratio(%)62.04514.1061.94263.9061.84153.8061.74023.7061.64013.7062.23993.60,valuecountratio(%)44.010.0052.310.0053.010.0053.110.0053.210.0055.210.00,valuecountratio(%)70.010.0070.110.0070.210.0071.010.0071.210.0071.610.00,

0,1
size,10788.0
distinct,138.0
distinct(%),1.28
missing,0.0
missing(%),0.0
minimum,44.0
maximum,71.6

0,1
zeros,0.0
zeros(%),0.0
mean,61.75
median,61.8
sum,666184.0
sd,1.41
skewness,-0.26

0,1
minimun,44.0
5-th per.,59.4
Q1,61.0
median,61.8
Q3,62.5
95-th per.,63.8
maximum,71.6

0,1,2
value,count,ratio(%)
62.0,451,4.10
61.9,426,3.90
61.8,415,3.80
61.7,402,3.70
61.6,401,3.70
62.2,399,3.60

0,1,2
value,count,ratio(%)
44.0,1,0.00
52.3,1,0.00
53.0,1,0.00
53.1,1,0.00
53.2,1,0.00
55.2,1,0.00

0,1,2
value,count,ratio(%)
70.0,1,0.00
70.1,1,0.00
70.2,1,0.00
71.0,1,0.00
71.2,1,0.00
71.6,1,0.00


----------

### 6. "table"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct123distinct(%)0.28missing0missing(%)0.00minimum43.0maximum95.0,zeros0zeros(%)0.00mean57.46median57.00sum2479515.80sd2.24skewness0.84,minimun43.05-th per.54.00Q156.00median57.0Q359.0095-th per.61.00maximum95.0,valuecountratio(%)56.0785618.2057.0777718.0058.0673115.5059.0525712.1055.0502311.6060.034187.90,valuecountratio(%)43.010.0044.010.0049.020.0051.070.0051.610.0052.0360.00,valuecountratio(%)70.090.0071.010.0073.040.0076.010.0079.010.0095.010.00,

0,1
size,43152.0
distinct,123.0
distinct(%),0.28
missing,0.0
missing(%),0.0
minimum,43.0
maximum,95.0

0,1
zeros,0.0
zeros(%),0.0
mean,57.46
median,57.0
sum,2479515.8
sd,2.24
skewness,0.84

0,1
minimun,43.0
5-th per.,54.0
Q1,56.0
median,57.0
Q3,59.0
95-th per.,61.0
maximum,95.0

0,1,2
value,count,ratio(%)
56.0,7856,18.20
57.0,7777,18.00
58.0,6731,15.50
59.0,5257,12.10
55.0,5023,11.60
60.0,3418,7.90

0,1,2
value,count,ratio(%)
43.0,1,0.00
44.0,1,0.00
49.0,2,0.00
51.0,7,0.00
51.6,1,0.00
52.0,36,0.00

0,1,2
value,count,ratio(%)
70.0,9,0.00
71.0,1,0.00
73.0,4,0.00
76.0,1,0.00
79.0,1,0.00
95.0,1,0.00


0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size10788distinct87distinct(%)0.81missing0missing(%)0.00minimum50.0maximum68.0,zeros0zeros(%)0.00mean57.45median57.00sum619724.70sd2.22skewness0.62,minimun50.05-th per.54.00Q156.00median57.0Q359.0095-th per.61.00maximum68.0,valuecountratio(%)56.0202518.7057.0194718.0058.0163815.1059.0131512.1055.0124511.5060.08237.60,valuecountratio(%)50.020.0050.110.0051.020.0052.0200.1052.410.0053.01181.00,valuecountratio(%)63.01241.1064.0570.5065.0320.2066.0150.1067.070.0068.040.00,

0,1
size,10788.0
distinct,87.0
distinct(%),0.81
missing,0.0
missing(%),0.0
minimum,50.0
maximum,68.0

0,1
zeros,0.0
zeros(%),0.0
mean,57.45
median,57.0
sum,619724.7
sd,2.22
skewness,0.62

0,1
minimun,50.0
5-th per.,54.0
Q1,56.0
median,57.0
Q3,59.0
95-th per.,61.0
maximum,68.0

0,1,2
value,count,ratio(%)
56.0,2025,18.70
57.0,1947,18.00
58.0,1638,15.10
59.0,1315,12.10
55.0,1245,11.50
60.0,823,7.60

0,1,2
value,count,ratio(%)
50.0,2,0.00
50.1,1,0.00
51.0,2,0.00
52.0,20,0.10
52.4,1,0.00
53.0,118,1.00

0,1,2
value,count,ratio(%)
63.0,124,1.10
64.0,57,0.50
65.0,32,0.20
66.0,15,0.10
67.0,7,0.00
68.0,4,0.00


----------

### 7. "price"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct10645distinct(%)24.67missing0missing(%)0.00minimum326maximum18823,zeros0zeros(%)0.00mean3913.03median2394.00sum168855182.00sd3968.66skewness1.62,minimun326.05-th per.544.00Q1949.00median2394.0Q35296.2595-th per.13060.00maximum18823.0,valuecountratio(%)625.01070.20605.01050.20698.01000.20802.0980.20776.0980.20789.0980.20,valuecountratio(%)326.010.00327.010.00335.010.00336.020.00337.020.00338.010.00,valuecountratio(%)18788.010.0018791.010.0018795.010.0018804.010.0018806.010.0018823.010.00,

0,1
size,43152.0
distinct,10645.0
distinct(%),24.67
missing,0.0
missing(%),0.0
minimum,326.0
maximum,18823.0

0,1
zeros,0.0
zeros(%),0.0
mean,3913.03
median,2394.0
sum,168855182.0
sd,3968.66
skewness,1.62

0,1
minimun,326.0
5-th per.,544.0
Q1,949.0
median,2394.0
Q3,5296.25
95-th per.,13060.0
maximum,18823.0

0,1,2
value,count,ratio(%)
625.0,107,0.20
605.0,105,0.20
698.0,100,0.20
802.0,98,0.20
776.0,98,0.20
789.0,98,0.20

0,1,2
value,count,ratio(%)
326.0,1,0.00
327.0,1,0.00
335.0,1,0.00
336.0,2,0.00
337.0,2,0.00
338.0,1,0.00

0,1,2
value,count,ratio(%)
18788.0,1,0.00
18791.0,1,0.00
18795.0,1,0.00
18804.0,1,0.00
18806.0,1,0.00
18823.0,1,0.00


0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size10788distinct5394distinct(%)50.00missing0missing(%)0.00minimum326maximum18818,zeros0zeros(%)0.00mean4011.87median2447.00sum43280035.00sd4070.74skewness1.60,minimun326.05-th per.552.00Q1954.00median2447.0Q35431.5095-th per.13323.05maximum18818.0,valuecountratio(%)802.0290.20828.0270.20684.0270.20605.0270.20776.0260.20666.0260.20,valuecountratio(%)326.010.00334.010.00351.020.00357.010.00362.010.00363.010.00,valuecountratio(%)18779.010.0018791.010.0018795.010.0018797.010.0018803.010.0018818.010.00,

0,1
size,10788.0
distinct,5394.0
distinct(%),50.0
missing,0.0
missing(%),0.0
minimum,326.0
maximum,18818.0

0,1
zeros,0.0
zeros(%),0.0
mean,4011.87
median,2447.0
sum,43280035.0
sd,4070.74
skewness,1.6

0,1
minimun,326.0
5-th per.,552.0
Q1,954.0
median,2447.0
Q3,5431.5
95-th per.,13323.05
maximum,18818.0

0,1,2
value,count,ratio(%)
802.0,29,0.20
828.0,27,0.20
684.0,27,0.20
605.0,27,0.20
776.0,26,0.20
666.0,26,0.20

0,1,2
value,count,ratio(%)
326.0,1,0.00
334.0,1,0.00
351.0,2,0.00
357.0,1,0.00
362.0,1,0.00
363.0,1,0.00

0,1,2
value,count,ratio(%)
18779.0,1,0.00
18791.0,1,0.00
18795.0,1,0.00
18797.0,1,0.00
18803.0,1,0.00
18818.0,1,0.00


----------

### 8. "x"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct548distinct(%)1.27missing0missing(%)0.00minimum0.0maximum10.74,zeros6zeros(%)0.01mean5.73median5.69sum247128.96sd1.12skewness0.38,minimun0.05-th per.4.29Q14.71median5.69Q36.5395-th per.7.65maximum10.74,valuecountratio(%)4.373500.804.333470.804.343440.704.323360.704.383310.704.353270.70,valuecountratio(%)0.060.003.7320.003.7410.003.7610.003.7710.003.7910.00,valuecountratio(%)10.010.0010.0110.0010.0210.0010.1410.0010.2310.0010.7410.00,

0,1
size,43152.0
distinct,548.0
distinct(%),1.27
missing,0.0
missing(%),0.0
minimum,0.0
maximum,10.74

0,1
zeros,6.0
zeros(%),0.01
mean,5.73
median,5.69
sum,247128.96
sd,1.12
skewness,0.38

0,1
minimun,0.0
5-th per.,4.29
Q1,4.71
median,5.69
Q3,6.53
95-th per.,7.65
maximum,10.74

0,1,2
value,count,ratio(%)
4.37,350,0.80
4.33,347,0.80
4.34,344,0.70
4.32,336,0.70
4.38,331,0.70
4.35,327,0.70

0,1,2
value,count,ratio(%)
0.0,6,0.00
3.73,2,0.00
3.74,1,0.00
3.76,1,0.00
3.77,1,0.00
3.79,1,0.00

0,1,2
value,count,ratio(%)
10.0,1,0.00
10.01,1,0.00
10.02,1,0.00
10.14,1,0.00
10.23,1,0.00
10.74,1,0.00


0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size10788distinct502distinct(%)4.65missing0missing(%)0.00minimum0.0maximum9.66,zeros2zeros(%)0.02mean5.75median5.71sum62009.66sd1.13skewness0.36,minimun0.05-th per.4.29Q14.71median5.71Q36.5695-th per.7.71maximum9.66,valuecountratio(%)4.37980.904.38970.804.34930.804.32890.804.33820.704.29810.70,valuecountratio(%)0.020.003.7910.003.8210.003.8410.003.8520.003.8620.00,valuecountratio(%)9.0810.009.110.009.2410.009.3210.009.6510.009.6610.00,

0,1
size,10788.0
distinct,502.0
distinct(%),4.65
missing,0.0
missing(%),0.0
minimum,0.0
maximum,9.66

0,1
zeros,2.0
zeros(%),0.02
mean,5.75
median,5.71
sum,62009.66
sd,1.13
skewness,0.36

0,1
minimun,0.0
5-th per.,4.29
Q1,4.71
median,5.71
Q3,6.56
95-th per.,7.71
maximum,9.66

0,1,2
value,count,ratio(%)
4.37,98,0.90
4.38,97,0.80
4.34,93,0.80
4.32,89,0.80
4.33,82,0.70
4.29,81,0.70

0,1,2
value,count,ratio(%)
0.0,2,0.00
3.79,1,0.00
3.82,1,0.00
3.84,1,0.00
3.85,2,0.00
3.86,2,0.00

0,1,2
value,count,ratio(%)
9.08,1,0.00
9.1,1,0.00
9.24,1,0.00
9.32,1,0.00
9.65,1,0.00
9.66,1,0.00


----------

### 9. "y"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct545distinct(%)1.26missing0missing(%)0.00minimum0.0maximum58.9,zeros5zeros(%)0.01mean5.73median5.71sum247295.30sd1.15skewness2.92,minimun0.05-th per.4.29Q14.72median5.71Q36.5395-th per.7.64maximum58.9,valuecountratio(%)4.343510.804.373450.704.393340.704.333330.704.353310.704.383240.70,valuecountratio(%)0.050.003.6810.003.7120.003.7210.003.7310.003.7510.00,valuecountratio(%)9.9420.0010.110.0010.1610.0010.5410.0031.810.0058.910.00,

0,1
size,43152.0
distinct,545.0
distinct(%),1.26
missing,0.0
missing(%),0.0
minimum,0.0
maximum,58.9

0,1
zeros,5.0
zeros(%),0.01
mean,5.73
median,5.71
sum,247295.3
sd,1.15
skewness,2.92

0,1
minimun,0.0
5-th per.,4.29
Q1,4.72
median,5.71
Q3,6.53
95-th per.,7.64
maximum,58.9

0,1,2
value,count,ratio(%)
4.34,351,0.80
4.37,345,0.70
4.39,334,0.70
4.33,333,0.70
4.35,331,0.70
4.38,324,0.70

0,1,2
value,count,ratio(%)
0.0,5,0.00
3.68,1,0.00
3.71,2,0.00
3.72,1,0.00
3.73,1,0.00
3.75,1,0.00

0,1,2
value,count,ratio(%)
9.94,2,0.00
10.1,1,0.00
10.16,1,0.00
10.54,1,0.00
31.8,1,0.00
58.9,1,0.00


0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size10788distinct497distinct(%)4.61missing0missing(%)0.00minimum0.0maximum9.63,zeros2zeros(%)0.02mean5.75median5.72sum62025.03sd1.12skewness0.35,minimun0.05-th per.4.30Q14.73median5.72Q36.5695-th per.7.69maximum9.63,valuecountratio(%)4.35940.804.37900.804.32900.804.33880.804.41870.804.34860.70,valuecountratio(%)0.020.003.7710.003.7810.003.810.003.8110.003.8410.00,valuecountratio(%)8.9710.009.0120.009.1310.009.1910.009.5910.009.6310.00,

0,1
size,10788.0
distinct,497.0
distinct(%),4.61
missing,0.0
missing(%),0.0
minimum,0.0
maximum,9.63

0,1
zeros,2.0
zeros(%),0.02
mean,5.75
median,5.72
sum,62025.03
sd,1.12
skewness,0.35

0,1
minimun,0.0
5-th per.,4.3
Q1,4.73
median,5.72
Q3,6.56
95-th per.,7.69
maximum,9.63

0,1,2
value,count,ratio(%)
4.35,94,0.80
4.37,90,0.80
4.32,90,0.80
4.33,88,0.80
4.41,87,0.80
4.34,86,0.70

0,1,2
value,count,ratio(%)
0.0,2,0.00
3.77,1,0.00
3.78,1,0.00
3.8,1,0.00
3.81,1,0.00
3.84,1,0.00

0,1,2
value,count,ratio(%)
8.97,1,0.00
9.01,2,0.00
9.13,1,0.00
9.19,1,0.00
9.59,1,0.00
9.63,1,0.00


----------

### 10. "z"

0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size43152distinct365distinct(%)0.84missing0missing(%)0.00minimum0.0maximum8.06,zeros17zeros(%)0.04mean3.54median3.52sum152565.54sd0.69skewness0.35,minimun0.05-th per.2.65Q12.91median3.52Q34.0395-th per.4.73maximum8.06,valuecountratio(%)2.76251.402.716171.402.696061.402.685911.302.725561.202.675141.10,valuecountratio(%)0.0170.001.0710.001.5310.002.0610.002.2410.002.2710.00,valuecountratio(%)6.3110.006.3810.006.4310.006.7210.006.9810.008.0610.00,

0,1
size,43152.0
distinct,365.0
distinct(%),0.84
missing,0.0
missing(%),0.0
minimum,0.0
maximum,8.06

0,1
zeros,17.0
zeros(%),0.04
mean,3.54
median,3.52
sum,152565.54
sd,0.69
skewness,0.35

0,1
minimun,0.0
5-th per.,2.65
Q1,2.91
median,3.52
Q3,4.03
95-th per.,4.73
maximum,8.06

0,1,2
value,count,ratio(%)
2.7,625,1.40
2.71,617,1.40
2.69,606,1.40
2.68,591,1.30
2.72,556,1.20
2.67,514,1.10

0,1,2
value,count,ratio(%)
0.0,17,0.00
1.07,1,0.00
1.53,1,0.00
2.06,1,0.00
2.24,1,0.00
2.27,1,0.00

0,1,2
value,count,ratio(%)
6.31,1,0.00
6.38,1,0.00
6.43,1,0.00
6.72,1,0.00
6.98,1,0.00
8.06,1,0.00


0,1,2,3,4,5,6
| Descriptive Stat. |,| Descriptive Stat. |,| Quantile Stat. |,| Common Values |,| Min Values |,| Max Values |,| Histogram |
size10788distinct325distinct(%)3.01missing0missing(%)0.00minimum0.0maximum31.8,zeros3zeros(%)0.03mean3.55median3.53sum38313.76sd0.75skewness5.27,minimun0.05-th per.2.66Q12.91median3.53Q34.0495-th per.4.75maximum31.8,valuecountratio(%)2.691421.302.71421.302.721411.302.681391.202.671351.202.731251.10,valuecountratio(%)0.030.001.4110.002.2510.002.2610.002.2810.002.310.00,valuecountratio(%)5.6710.005.7310.005.7710.005.8610.006.0320.0031.810.00,

0,1
size,10788.0
distinct,325.0
distinct(%),3.01
missing,0.0
missing(%),0.0
minimum,0.0
maximum,31.8

0,1
zeros,3.0
zeros(%),0.03
mean,3.55
median,3.53
sum,38313.76
sd,0.75
skewness,5.27

0,1
minimun,0.0
5-th per.,2.66
Q1,2.91
median,3.53
Q3,4.04
95-th per.,4.75
maximum,31.8

0,1,2
value,count,ratio(%)
2.69,142,1.30
2.7,142,1.30
2.72,141,1.30
2.68,139,1.20
2.67,135,1.20
2.73,125,1.10

0,1,2
value,count,ratio(%)
0.0,3,0.00
1.41,1,0.00
2.25,1,0.00
2.26,1,0.00
2.28,1,0.00
2.3,1,0.00

0,1,2
value,count,ratio(%)
5.67,1,0.00
5.73,1,0.00
5.77,1,0.00
5.86,1,0.00
6.03,2,0.00
31.8,1,0.00


----------

## 3. Target by Feature Render 함수

### 3.1 render_target_by_feature_clf

In [55]:
# Classification demo: render the 'Survived' target against each remaining
# column of the Titanic data. 'Name', 'Ticket' and 'Cabin' are dropped first.
# NOTE(review): 'PassengerId' is not dropped and appears in the rendered output
# as a feature — confirm whether that is intended.
exp.render_target_by_feature_clf(
    df_titanic.drop(columns=['Name', 'Ticket', 'Cabin']),
    target='Survived',
    set_name='Titanic',
)

## Titanic Target Distributiones

0,1
"""Survived"" by ""PassengerId""","""Survived"" by ""PassengerId"""
Class Distribution,Normalized Distribution
,


0,1
"""Survived"" by ""SibSp""","""Survived"" by ""SibSp"""
Class Distribution,Normalized Distribution
,


0,1
"""Survived"" by ""Parch""","""Survived"" by ""Parch"""
Class Distribution,Normalized Distribution
,


0,1
"""Survived"" by ""Age""","""Survived"" by ""Age"""
Class Distribution,Normalized Distribution
,


0,1
"""Survived"" by ""Fare""","""Survived"" by ""Fare"""
Class Distribution,Normalized Distribution
,


0,1
"""Survived"" by ""Pclass""","""Survived"" by ""Pclass"""
Class Counts,Normalized Counts
,


0,1
"""Survived"" by ""Sex""","""Survived"" by ""Sex"""
Class Counts,Normalized Counts
,


0,1
"""Survived"" by ""Embarked""","""Survived"" by ""Embarked"""
Class Counts,Normalized Counts
,


### 3.2 render_target_by_feature_reg

In [56]:
# Regression demo: render the 'price' target against every other column of the
# diamonds data; `set_name` is used in the heading of the rendered report.
exp.render_target_by_feature_reg(
    df_diamonds,
    target='price',
    set_name='Diamonds',
)

## Diamonds Target Distributiones

0,1,2
"""price"" Distribution by ""carat""","""price"" Distribution by ""carat""","""price"" Distribution by ""carat"""
,,


0,1,2
"""price"" Distribution by ""depth""","""price"" Distribution by ""depth""","""price"" Distribution by ""depth"""
,,


0,1,2
"""price"" Distribution by ""table""","""price"" Distribution by ""table""","""price"" Distribution by ""table"""
,,


0,1,2
"""price"" Distribution by ""x""","""price"" Distribution by ""x""","""price"" Distribution by ""x"""
,,


0,1,2
"""price"" Distribution by ""y""","""price"" Distribution by ""y""","""price"" Distribution by ""y"""
,,


0,1,2
"""price"" Distribution by ""z""","""price"" Distribution by ""z""","""price"" Distribution by ""z"""
,,


0,1
"""price"" Distribution by ""cut""","""price"" Distribution by ""cut"""
,


0,1
"""price"" Distribution by ""color""","""price"" Distribution by ""color"""
,


0,1
"""price"" Distribution by ""clarity""","""price"" Distribution by ""clarity"""
,
