## pandas-profiling Meteorites example
Source of data: https://data.nasa.gov/Space-Science/Meteorite-Landings/gh4g-9sfh

### Import libraries

In [1]:
import pandas as pd
import pandas_profiling
import numpy as np

In [2]:
%%javascript
require.config({
paths: {
d3: "https://d3js.org/d3.v5.min",
}
});

require(["d3"], function(d3) {
window.d3 = d3;
});

<IPython.core.display.Javascript object>

### Load and prepare example dataset
We add some fake variables for illustrating pandas-profiling capabilities

In [15]:
df = pd.DataFrame({'porta': ['duas', 'quatro', 'duas', 'quatro', 'quatro', 'duas', 'duas'],
                   'combustivel': ['gas', 'diesel', 'gas', 'gas', 'diesel', 'diesel', 'gas'],
                   'body-style': ['sedan', 'hatch', 'hatch', 'sedan', 'sedan', 'hatch', 'hatch']
                   })

In [5]:
columns = ["symboling", "normalized-losses", "make", "fuel-type", "aspiration", "num-of-doors", "body-style", "drive-wheels", "engine-location", "wheel-base", "length", "width", "height",
           "curb-weight", "engine-type", "num-of-cylinders", "engine-size", "fuel-system", "bore", "stroke", "compression-ratio", "horsepower", "peak-rpm", "city-mpg", "highway-mpg", "price"]

df = pd.read_csv('imports-85.data', names=columns)

for col in df.columns:
    df[col] = pd.to_numeric(df[col], errors='ignore')

df.replace(to_replace=["na", "?", np.nan, "missing", "not available","n/a", "missing value"], value=np.nan, inplace=True)

In [4]:
df=pd.read_csv("Meteorite_Landings.csv", parse_dates=['year'], encoding='UTF-8')

# Note: Pandas does not support dates before 1880, so we ignore these for this analysis
df['year'] = pd.to_datetime(df['year'], errors='coerce')

# Example: Constant variable
df['source'] = "NASA"

# Example: Boolean variable
df['boolean'] = np.random.choice([True, False], df.shape[0])

# Example: Mixed with base types
df['mixed'] = np.random.choice([1, "A"], df.shape[0])

# Example: Highly correlated variables
df['reclat_city'] = df['reclat'] + np.random.normal(scale=5,size=(len(df)))

# Example: Duplicate observations
duplicates_to_add = pd.DataFrame(df.iloc[0:10])
duplicates_to_add[u'name'] = duplicates_to_add[u'name'] + " copy"

df = df.append(duplicates_to_add, ignore_index=True)

### Inline report without saving object

In [6]:
pandas_profiling.ProfileReport(df)

  variable_stats = pd.concat(ldesc, join_axes=pd.Index([names]), axis=1)


0,1
Total size in memory,41.8 KiB
Average record size in memory,208.6 B

0,1
Distinct count,6
Unique (%),2.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0
Zeros (%),32.7%

0,1
Minimum,-2
5-th percentile,-1
Q1,0
Median,1
Q3,2
95-th percentile,3
Maximum,3
Range,5
Interquartile range,2

0,1
Standard deviation,1.2453
Coef of variation,1.4929
Kurtosis,-0.67627
Mean,0.83415
MAD,1.0219
Skewness,0.21107
Sum,171
Variance,1.5508
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
0,67,32.7%,
1,54,26.3%,
2,32,15.6%,
3,27,13.2%,
-1,22,10.7%,
-2,3,1.5%,

Value,Count,Frequency (%),Unnamed: 3
-2,3,1.5%,
-1,22,10.7%,
0,67,32.7%,
1,54,26.3%,
2,32,15.6%,

Value,Count,Frequency (%),Unnamed: 3
-1,22,10.7%,
0,67,32.7%,
1,54,26.3%,
2,32,15.6%,
3,27,13.2%,

0,1
Distinct count,52
Unique (%),25.4%
Missing (%),20.0%
Missing (n),41
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,65
5-th percentile,74
Q1,94
Median,115
Q3,150
95-th percentile,188
Maximum,256
Range,191
Interquartile range,56

0,1
Standard deviation,35.442
Coef of variation,0.29051
Kurtosis,0.52544
Mean,122
MAD,29.122
Skewness,0.76598
Sum,20008
Variance,1256.1
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
161.0,11,5.4%,
91.0,8,3.9%,
150.0,7,3.4%,
104.0,6,2.9%,
134.0,6,2.9%,
128.0,6,2.9%,
94.0,5,2.4%,
74.0,5,2.4%,
85.0,5,2.4%,
103.0,5,2.4%,

Value,Count,Frequency (%),Unnamed: 3
65.0,5,2.4%,
74.0,5,2.4%,
77.0,1,0.5%,
78.0,1,0.5%,
81.0,2,1.0%,

Value,Count,Frequency (%),Unnamed: 3
192.0,2,1.0%,
194.0,2,1.0%,
197.0,2,1.0%,
231.0,1,0.5%,
256.0,1,0.5%,

0,1
Distinct count,22
Unique (%),10.7%
Missing (%),0.0%
Missing (n),0

0,1
toyota,32
nissan,18
mazda,17
Other values (19),138

Value,Count,Frequency (%),Unnamed: 3
toyota,32,15.6%,
nissan,18,8.8%,
mazda,17,8.3%,
honda,13,6.3%,
mitsubishi,13,6.3%,
volkswagen,12,5.9%,
subaru,12,5.9%,
peugot,11,5.4%,
volvo,11,5.4%,
dodge,9,4.4%,

0,1
Distinct count,2
Unique (%),1.0%
Missing (%),0.0%
Missing (n),0

0,1
gas,185
diesel,20

Value,Count,Frequency (%),Unnamed: 3
gas,185,90.2%,
diesel,20,9.8%,

0,1
Distinct count,2
Unique (%),1.0%
Missing (%),0.0%
Missing (n),0

0,1
std,168
turbo,37

Value,Count,Frequency (%),Unnamed: 3
std,168,82.0%,
turbo,37,18.0%,

0,1
Distinct count,3
Unique (%),1.5%
Missing (%),1.0%
Missing (n),2

0,1
four,114
two,89
(Missing),2

Value,Count,Frequency (%),Unnamed: 3
four,114,55.6%,
two,89,43.4%,
(Missing),2,1.0%,

0,1
Distinct count,5
Unique (%),2.4%
Missing (%),0.0%
Missing (n),0

0,1
sedan,96
hatchback,70
wagon,25
Other values (2),14

Value,Count,Frequency (%),Unnamed: 3
sedan,96,46.8%,
hatchback,70,34.1%,
wagon,25,12.2%,
hardtop,8,3.9%,
convertible,6,2.9%,

0,1
Distinct count,3
Unique (%),1.5%
Missing (%),0.0%
Missing (n),0

0,1
fwd,120
rwd,76
4wd,9

Value,Count,Frequency (%),Unnamed: 3
fwd,120,58.5%,
rwd,76,37.1%,
4wd,9,4.4%,

0,1
Distinct count,2
Unique (%),1.0%
Missing (%),0.0%
Missing (n),0

0,1
front,202
rear,3

Value,Count,Frequency (%),Unnamed: 3
front,202,98.5%,
rear,3,1.5%,

0,1
Distinct count,53
Unique (%),25.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,86.6
5-th percentile,93.02
Q1,94.5
Median,97.0
Q3,102.4
95-th percentile,110.0
Maximum,120.9
Range,34.3
Interquartile range,7.9

0,1
Standard deviation,6.0218
Coef of variation,0.060976
Kurtosis,1.017
Mean,98.757
MAD,4.6622
Skewness,1.0502
Sum,20245
Variance,36.262
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
94.5,21,10.2%,
93.7,20,9.8%,
95.7,13,6.3%,
96.5,8,3.9%,
98.4,7,3.4%,
97.3,7,3.4%,
96.3,6,2.9%,
107.9,6,2.9%,
98.8,6,2.9%,
99.1,6,2.9%,

Value,Count,Frequency (%),Unnamed: 3
86.6,2,1.0%,
88.4,1,0.5%,
88.6,2,1.0%,
89.5,3,1.5%,
91.3,2,1.0%,

Value,Count,Frequency (%),Unnamed: 3
112.0,1,0.5%,
113.0,2,1.0%,
114.2,4,2.0%,
115.6,2,1.0%,
120.9,1,0.5%,

0,1
Distinct count,75
Unique (%),36.6%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,141.1
5-th percentile,157.14
Q1,166.3
Median,173.2
Q3,183.1
95-th percentile,196.36
Maximum,208.1
Range,67.0
Interquartile range,16.8

0,1
Standard deviation,12.337
Coef of variation,0.070884
Kurtosis,-0.082895
Mean,174.05
MAD,9.5943
Skewness,0.15595
Sum,35680
Variance,152.21
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
157.3,15,7.3%,
188.8,11,5.4%,
166.3,7,3.4%,
171.7,7,3.4%,
186.7,7,3.4%,
165.3,6,2.9%,
177.8,6,2.9%,
176.2,6,2.9%,
186.6,6,2.9%,
176.8,5,2.4%,

Value,Count,Frequency (%),Unnamed: 3
141.1,1,0.5%,
144.6,2,1.0%,
150.0,3,1.5%,
155.9,3,1.5%,
156.9,1,0.5%,

Value,Count,Frequency (%),Unnamed: 3
198.9,4,2.0%,
199.2,1,0.5%,
199.6,2,1.0%,
202.6,2,1.0%,
208.1,1,0.5%,

0,1
Distinct count,44
Unique (%),21.5%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,60.3
5-th percentile,63.6
Q1,64.1
Median,65.5
Q3,66.9
95-th percentile,70.46
Maximum,72.3
Range,12.0
Interquartile range,2.8

0,1
Standard deviation,2.1452
Coef of variation,0.032549
Kurtosis,0.70276
Mean,65.908
MAD,1.6783
Skewness,0.904
Sum,13511
Variance,4.6019
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
63.8,24,11.7%,
66.5,23,11.2%,
65.4,15,7.3%,
63.6,11,5.4%,
64.4,10,4.9%,
68.4,10,4.9%,
64.0,9,4.4%,
65.5,8,3.9%,
65.2,7,3.4%,
66.3,6,2.9%,

Value,Count,Frequency (%),Unnamed: 3
60.3,1,0.5%,
61.8,1,0.5%,
62.5,1,0.5%,
63.4,1,0.5%,
63.6,11,5.4%,

Value,Count,Frequency (%),Unnamed: 3
70.9,1,0.5%,
71.4,3,1.5%,
71.7,3,1.5%,
72.0,1,0.5%,
72.3,1,0.5%,

0,1
Distinct count,49
Unique (%),23.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,47.8
5-th percentile,49.7
Q1,52.0
Median,54.1
Q3,55.5
95-th percentile,57.5
Maximum,59.8
Range,12.0
Interquartile range,3.5

0,1
Standard deviation,2.4435
Coef of variation,0.045482
Kurtosis,-0.44381
Mean,53.725
MAD,2.015
Skewness,0.063123
Sum,11014
Variance,5.9708
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
50.8,14,6.8%,
52.0,12,5.9%,
55.7,12,5.9%,
54.5,10,4.9%,
54.1,10,4.9%,
55.5,9,4.4%,
56.7,8,3.9%,
54.3,8,3.9%,
51.6,7,3.4%,
56.1,7,3.4%,

Value,Count,Frequency (%),Unnamed: 3
47.8,1,0.5%,
48.8,2,1.0%,
49.4,2,1.0%,
49.6,4,2.0%,
49.7,3,1.5%,

Value,Count,Frequency (%),Unnamed: 3
57.5,3,1.5%,
58.3,1,0.5%,
58.7,4,2.0%,
59.1,3,1.5%,
59.8,2,1.0%,

0,1
Distinct count,171
Unique (%),83.4%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,1488
5-th percentile,1901
Q1,2145
Median,2414
Q3,2935
95-th percentile,3503
Maximum,4066
Range,2578
Interquartile range,790

0,1
Standard deviation,520.68
Coef of variation,0.20374
Kurtosis,-0.042854
Mean,2555.6
MAD,428.27
Skewness,0.6814
Sum,523891
Variance,271110
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
2385,4,2.0%,
1989,3,1.5%,
1918,3,1.5%,
2275,3,1.5%,
3230,2,1.0%,
2410,2,1.0%,
3252,2,1.0%,
2337,2,1.0%,
2403,2,1.0%,
2414,2,1.0%,

Value,Count,Frequency (%),Unnamed: 3
1488,1,0.5%,
1713,1,0.5%,
1819,1,0.5%,
1837,1,0.5%,
1874,2,1.0%,

Value,Count,Frequency (%),Unnamed: 3
3750,1,0.5%,
3770,1,0.5%,
3900,1,0.5%,
3950,1,0.5%,
4066,2,1.0%,

0,1
Distinct count,7
Unique (%),3.4%
Missing (%),0.0%
Missing (n),0

0,1
ohc,148
ohcf,15
ohcv,13
Other values (4),29

Value,Count,Frequency (%),Unnamed: 3
ohc,148,72.2%,
ohcf,15,7.3%,
ohcv,13,6.3%,
dohc,12,5.9%,
l,12,5.9%,
rotor,4,2.0%,
dohcv,1,0.5%,

0,1
Distinct count,7
Unique (%),3.4%
Missing (%),0.0%
Missing (n),0

0,1
four,159
six,24
five,11
Other values (4),11

Value,Count,Frequency (%),Unnamed: 3
four,159,77.6%,
six,24,11.7%,
five,11,5.4%,
eight,5,2.4%,
two,4,2.0%,
three,1,0.5%,
twelve,1,0.5%,

0,1
Distinct count,44
Unique (%),21.5%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,61.0
5-th percentile,90.0
Q1,97.0
Median,120.0
Q3,141.0
95-th percentile,201.2
Maximum,326.0
Range,265.0
Interquartile range,44.0

0,1
Standard deviation,41.643
Coef of variation,0.32813
Kurtosis,5.3057
Mean,126.91
MAD,30.224
Skewness,1.9477
Sum,26016
Variance,1734.1
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
122,15,7.3%,
92,15,7.3%,
98,14,6.8%,
97,14,6.8%,
108,13,6.3%,
90,12,5.9%,
110,12,5.9%,
109,8,3.9%,
120,7,3.4%,
141,7,3.4%,

Value,Count,Frequency (%),Unnamed: 3
61,1,0.5%,
70,3,1.5%,
79,1,0.5%,
80,1,0.5%,
90,12,5.9%,

Value,Count,Frequency (%),Unnamed: 3
234,2,1.0%,
258,2,1.0%,
304,1,0.5%,
308,1,0.5%,
326,1,0.5%,

0,1
Distinct count,8
Unique (%),3.9%
Missing (%),0.0%
Missing (n),0

0,1
mpfi,94
2bbl,66
idi,20
Other values (5),25

Value,Count,Frequency (%),Unnamed: 3
mpfi,94,45.9%,
2bbl,66,32.2%,
idi,20,9.8%,
1bbl,11,5.4%,
spdi,9,4.4%,
4bbl,3,1.5%,
spfi,1,0.5%,
mfi,1,0.5%,

0,1
Distinct count,39
Unique (%),19.0%
Missing (%),2.0%
Missing (n),4
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,2.54
5-th percentile,2.97
Q1,3.15
Median,3.31
Q3,3.59
95-th percentile,3.78
Maximum,3.94
Range,1.4
Interquartile range,0.44

0,1
Standard deviation,0.27354
Coef of variation,0.08215
Kurtosis,-0.82895
Mean,3.3298
MAD,0.23576
Skewness,0.020016
Sum,669.28
Variance,0.074823
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
3.62,23,11.2%,
3.19,20,9.8%,
3.15,15,7.3%,
2.97,12,5.9%,
3.03,12,5.9%,
3.46,9,4.4%,
3.78,8,3.9%,
3.43,8,3.9%,
3.31,8,3.9%,
3.27,7,3.4%,

Value,Count,Frequency (%),Unnamed: 3
2.54,1,0.5%,
2.68,1,0.5%,
2.91,7,3.4%,
2.92,1,0.5%,
2.97,12,5.9%,

Value,Count,Frequency (%),Unnamed: 3
3.74,3,1.5%,
3.76,1,0.5%,
3.78,8,3.9%,
3.8,2,1.0%,
3.94,2,1.0%,

0,1
Distinct count,37
Unique (%),18.0%
Missing (%),2.0%
Missing (n),4
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,2.07
5-th percentile,2.64
Q1,3.11
Median,3.29
Q3,3.41
95-th percentile,3.64
Maximum,4.17
Range,2.1
Interquartile range,0.3

0,1
Standard deviation,0.31672
Coef of variation,0.097289
Kurtosis,2.0742
Mean,3.2554
MAD,0.23178
Skewness,-0.68312
Sum,654.34
Variance,0.10031
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
3.4,20,9.8%,
3.03,14,6.8%,
3.15,14,6.8%,
3.23,14,6.8%,
3.39,13,6.3%,
2.64,11,5.4%,
3.35,9,4.4%,
3.29,9,4.4%,
3.46,8,3.9%,
3.07,6,2.9%,

Value,Count,Frequency (%),Unnamed: 3
2.07,1,0.5%,
2.19,2,1.0%,
2.36,1,0.5%,
2.64,11,5.4%,
2.68,2,1.0%,

Value,Count,Frequency (%),Unnamed: 3
3.58,6,2.9%,
3.64,5,2.4%,
3.86,4,2.0%,
3.9,3,1.5%,
4.17,2,1.0%,

0,1
Distinct count,32
Unique (%),15.6%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,7.0
5-th percentile,7.5
Q1,8.6
Median,9.0
Q3,9.4
95-th percentile,21.82
Maximum,23.0
Range,16.0
Interquartile range,0.8

0,1
Standard deviation,3.972
Coef of variation,0.39162
Kurtosis,5.2331
Mean,10.143
MAD,2.3279
Skewness,2.6109
Sum,2079.2
Variance,15.777
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
9.0,46,22.4%,
9.4,26,12.7%,
8.5,14,6.8%,
9.5,13,6.3%,
9.3,11,5.4%,
8.7,9,4.4%,
9.2,8,3.9%,
8.0,8,3.9%,
7.0,7,3.4%,
21.0,5,2.4%,

Value,Count,Frequency (%),Unnamed: 3
7.0,7,3.4%,
7.5,5,2.4%,
7.6,4,2.0%,
7.7,2,1.0%,
7.8,1,0.5%,

Value,Count,Frequency (%),Unnamed: 3
21.9,1,0.5%,
22.0,1,0.5%,
22.5,3,1.5%,
22.7,1,0.5%,
23.0,5,2.4%,

0,1
Distinct count,60
Unique (%),29.3%
Missing (%),1.0%
Missing (n),2
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,48.0
5-th percentile,62.0
Q1,70.0
Median,95.0
Q3,116.0
95-th percentile,181.4
Maximum,288.0
Range,240.0
Interquartile range,46.0

0,1
Standard deviation,39.714
Coef of variation,0.38093
Kurtosis,2.6233
Mean,104.26
MAD,30.505
Skewness,1.391
Sum,21164
Variance,1577.2
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
68.0,19,9.3%,
70.0,11,5.4%,
69.0,10,4.9%,
116.0,9,4.4%,
110.0,8,3.9%,
95.0,7,3.4%,
88.0,6,2.9%,
114.0,6,2.9%,
160.0,6,2.9%,
101.0,6,2.9%,

Value,Count,Frequency (%),Unnamed: 3
48.0,1,0.5%,
52.0,2,1.0%,
55.0,1,0.5%,
56.0,2,1.0%,
58.0,1,0.5%,

Value,Count,Frequency (%),Unnamed: 3
184.0,2,1.0%,
200.0,1,0.5%,
207.0,3,1.5%,
262.0,1,0.5%,
288.0,1,0.5%,

0,1
Distinct count,24
Unique (%),11.7%
Missing (%),1.0%
Missing (n),2
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,4150
5-th percentile,4250
Q1,4800
Median,5200
Q3,5500
95-th percentile,5990
Maximum,6600
Range,2450
Interquartile range,700

0,1
Standard deviation,479.33
Coef of variation,0.093522
Kurtosis,0.056526
Mean,5125.4
MAD,385.83
Skewness,0.073237
Sum,1040400
Variance,229760
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
5500.0,37,18.0%,
4800.0,36,17.6%,
5000.0,27,13.2%,
5200.0,23,11.2%,
5400.0,13,6.3%,
6000.0,9,4.4%,
4500.0,7,3.4%,
5800.0,7,3.4%,
5250.0,7,3.4%,
4200.0,5,2.4%,

Value,Count,Frequency (%),Unnamed: 3
4150.0,5,2.4%,
4200.0,5,2.4%,
4250.0,3,1.5%,
4350.0,4,2.0%,
4400.0,3,1.5%,

Value,Count,Frequency (%),Unnamed: 3
5750.0,1,0.5%,
5800.0,7,3.4%,
5900.0,3,1.5%,
6000.0,9,4.4%,
6600.0,2,1.0%,

0,1
Distinct count,29
Unique (%),14.1%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,13
5-th percentile,16
Q1,19
Median,24
Q3,30
95-th percentile,37
Maximum,49
Range,36
Interquartile range,11

0,1
Standard deviation,6.5421
Coef of variation,0.25941
Kurtosis,0.57865
Mean,25.22
MAD,5.2155
Skewness,0.6637
Sum,5170
Variance,42.8
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
31,28,13.7%,
19,27,13.2%,
24,22,10.7%,
27,14,6.8%,
17,13,6.3%,
26,12,5.9%,
23,12,5.9%,
21,8,3.9%,
30,8,3.9%,
25,8,3.9%,

Value,Count,Frequency (%),Unnamed: 3
13,1,0.5%,
14,2,1.0%,
15,3,1.5%,
16,6,2.9%,
17,13,6.3%,

Value,Count,Frequency (%),Unnamed: 3
37,6,2.9%,
38,7,3.4%,
45,1,0.5%,
47,1,0.5%,
49,1,0.5%,

0,1
Correlation,0.97134

0,1
Distinct count,187
Unique (%),91.2%
Missing (%),2.0%
Missing (n),4
Infinite (%),0.0%
Infinite (n),0
Zeros (%),0.0%

0,1
Minimum,5118
5-th percentile,6189
Q1,7775
Median,10295
Q3,16500
95-th percentile,32528
Maximum,45400
Range,40282
Interquartile range,8725

0,1
Standard deviation,7947.1
Coef of variation,0.60173
Kurtosis,3.2315
Mean,13207
MAD,5841.2
Skewness,1.8097
Sum,2654600
Variance,63156000
Memory size,1.7 KiB

Value,Count,Frequency (%),Unnamed: 3
5572.0,2,1.0%,
6229.0,2,1.0%,
9279.0,2,1.0%,
7775.0,2,1.0%,
8845.0,2,1.0%,
8495.0,2,1.0%,
7295.0,2,1.0%,
7609.0,2,1.0%,
7957.0,2,1.0%,
13499.0,2,1.0%,

Value,Count,Frequency (%),Unnamed: 3
5118.0,1,0.5%,
5151.0,1,0.5%,
5195.0,1,0.5%,
5348.0,1,0.5%,
5389.0,1,0.5%,

Value,Count,Frequency (%),Unnamed: 3
36880.0,1,0.5%,
37028.0,1,0.5%,
40960.0,1,0.5%,
41315.0,1,0.5%,
45400.0,1,0.5%,

Unnamed: 0,symboling,wheel-base,length,width,height,curb-weight,engine-size,compression-ratio,city-mpg,highway-mpg
symboling,1.0,-0.531954,-0.357612,-0.232919,-0.541038,-0.227691,-0.10579,-0.178515,-0.035823,0.034606
wheel-base,-0.531954,1.0,0.874587,0.795144,0.589435,0.776386,0.569329,0.249786,-0.470414,-0.544082
length,-0.357612,0.874587,1.0,0.841118,0.491029,0.877728,0.68336,0.158414,-0.670909,-0.704662
width,-0.232919,0.795144,0.841118,1.0,0.27921,0.867032,0.735433,0.181129,-0.642704,-0.677218
height,-0.541038,0.589435,0.491029,0.27921,1.0,0.295572,0.067149,0.261214,-0.04864,-0.107358
curb-weight,-0.227691,0.776386,0.877728,0.867032,0.295572,1.0,0.850594,0.151362,-0.757414,-0.797465
engine-size,-0.10579,0.569329,0.68336,0.735433,0.067149,0.850594,1.0,0.028971,-0.653658,-0.67747
compression-ratio,-0.178515,0.249786,0.158414,0.181129,0.261214,0.151362,0.028971,1.0,0.324701,0.265201
city-mpg,-0.035823,-0.470414,-0.670909,-0.642704,-0.04864,-0.757414,-0.653658,0.324701,1.0,0.971337
highway-mpg,0.034606,-0.544082,-0.704662,-0.677218,-0.107358,-0.797465,-0.67747,0.265201,0.971337,1.0


### Save report to file

In [7]:
pfr = pandas_profiling.ProfileReport(df)
pfr.to_file("example2.html")

  variable_stats = pd.concat(ldesc, join_axes=pd.Index([names]), axis=1)


#### Print existing ProfileReport object inline

In [None]:
pfr

In [None]:
import os
import sys
os.path.dirname(sys.executable)