# vDataFrame[].describe

In [None]:
vDataFrame[].describe(method: str = "auto", 
                      max_cardinality: int = 6,
                      numcol: str = "")

Aggregates the vcolumn using multiple statistical aggregations (min, max, median, unique, ...), depending on the input method.

### Parameters

<table id="parameters">
    <tr> <th>Name</th> <th>Type</th> <th>Optional</th> <th>Description</th> </tr>
    <tr> <td><div class="param_name">method</div></td> <td><div class="type">str</div></td> <td><div class = "yes">&#10003;</div></td> <td>The describe method.<br>
                                                    <ul>
                                                        <li><b>auto :</b> Sets the method to 'numerical' if the vcolumn is numerical, 'categorical' otherwise.</li>
                                                        <li><b>categorical :</b> Uses only categorical aggregations during the computation.</li>
                                                        <li><b>cat_stats :</b> Computes statistics of a numerical column for each vcolumn category. In this case, the parameter 'numcol' must be defined.</li>
                                                        <li><b>numerical :</b> Uses popular numerical aggregations during the computation.</li>
                                                    </ul></td> </tr>
    <tr> <td><div class="param_name">max_cardinality</div></td> <td><div class="type">int</div></td> <td><div class = "yes">&#10003;</div></td> <td>Cardinality threshold used to determine if the vcolumn will be considered as categorical.</td> </tr>
    <tr> <td><div class="param_name">numcol</div></td> <td><div class="type">str</div></td> <td><div class = "yes">&#10003;</div></td> <td>Numerical vcolumn to use when the parameter method is set to 'cat_stats'.</td> </tr>
</table>

### Returns

<a href="../../../utilities/tablesample">tablesample</a> : An object containing the result. For more information, check out <a href="../../../utilities/tablesample">utilities.tablesample</a>.

### Example

In [4]:
# Load the 'market' example dataset and display it.
from vertica_ml_python.learn.datasets import load_market
market = load_market()
print(market)

0,1,2,3
,Form,Price,Name
0.0,Fresh,1.1193087167,Acorn squash
1.0,Fresh,1.1722478842,Acorn squash
2.0,Fresh,1.56751539145,Apples
3.0,Fresh,1.6155336441,Apples
4.0,Frozen,0.5104657455,Apples
,...,...,...


<object>  Name: market, Number of rows: 314, Number of columns: 3


In [7]:
# Numerical aggregations of 'Price' (unique, count, mean, std, min, quantiles, ...)
market["Price"].describe(method = "numerical")

0,1
,value
name,"""Price"""
dtype,float
unique,308.0
count,314
mean,2.07751098603612
std,1.51037749575861
min,0.3166387792
25%,1.072761874325
50%,1.566898080825


<object>

In [10]:
# Only the counts of the 3 most frequent categories are displayed;
# the remaining categories are grouped under 'Others'.
market["Form"].describe(method = "categorical",
                        max_cardinality = 3)

0,1
,value
name,"""Form"""
dtype,varchar(32)
unique,37.0
Fresh,90
Others,90
Frozen,57
Canned,47


<object>

In [11]:
# Statistics of the numerical vcolumn 'Price', computed for each category of 'Form'
market["Form"].describe(method = "cat_stats", 
                        numcol = "Price")

0,1,2,3,4,5,6,7,8,9,10,11
,count,percent,mean,std,min,10%,25%,50%,75%,90%,max
"Beefsteak,",1,0.318471337579617834,3.15921213872,,3.15921213872,3.15921213872,3.15921213872,3.15921213872,3.15921213872,3.15921213872,3.15921213872
Boiled,2,0.636942675159235669,3.830154965845,0.0050356546423244,3.8265942203,3.827306369409,3.8283745930725,3.830154965845,3.8319353386175,3.833003562281,3.83371571139
Canned,47,14.968152866242038217,1.1649022634076,0.595638890885002,0.7843472032,0.8428270506668,0.902851046936,0.965253514158,1.12269898745,1.38030526322,3.38561047493
"Canned,",2,0.636942675159235669,4.63647686809,0.635894274349174,4.18683171458,4.276760745282,4.411654291335,4.63647686809,4.861299444845,4.996192990898,5.0861220216
"Canned, packed in syrup or water",2,0.636942675159235669,3.622330820065,0.146494766407389,3.51874337733,3.539460865877,3.5705370986975,3.622330820065,3.6741245414325,3.705200774253,3.7259182628
Cooked whole,2,0.636942675159235669,0.7576457039395,0.0227769157205302,0.741539992379,0.7447611346911,0.74959284815925,0.7576457039395,0.76569855971975,0.7705302731879,0.7737514155
Dried,30,9.554140127388535032,3.711283795031,2.60822802642759,1.085109083,1.40199224367,1.5408802667725,1.975096291315,5.5080500887675,7.371265288069,10.1637125484
Dried (Prunes),2,0.636942675159235669,4.38513566562,0.493264261155465,4.03634516164,4.106103262436,4.21074041363,4.38513566562,4.55953091761,4.664168068804,4.7339261696
Florets,4,1.273885350318471338,2.83238728437,0.435863589578331,2.3624557989,2.424260489439,2.5169675252475,2.848222451715,3.1636422108375,3.227845945425,3.27064843515


<object>

### See Also

<table id="seealso">
    <tr><td><a href="../../main-methods/agg">vDataFrame.aggregate</a></td> <td>Computes the vDataFrame input aggregations.</td></tr>
</table>