# vDataFrame[].normalize

In [None]:
vDataFrame[].normalize(method: str = "zscore", 
                       by: list = [], 
                       return_trans: bool = False)

Normalizes the vcolumn using the input method.

### Parameters

<table id="parameters">
    <tr> <th>Name</th> <th>Type</th> <th>Optional</th> <th>Description</th> </tr>
    <tr> <td><div class="param_name">method</div></td> <td><div class="type">str</div></td> <td><div class = "yes">&#10003;</div></td> <td>Method used to normalize.<br>
                                                    <ul>
                                                        <li><b>zscore :</b> Normalization using the Z-Score (avg and std) : (x - avg) / std</li>
                                                        <li><b>robust_zscore :</b> Normalization using the Robust Z-Score (median and mad) : (x - median) / (1.4826 * mad)</li>
                                                        <li><b>minmax :</b> Normalization using the MinMax (min and max) : (x - min) / (max - min)</li>
                                                        </ul></td> </tr>
    <tr> <td><div class="param_name">by</div></td> <td><div class="type">list</div></td> <td><div class = "yes">&#10003;</div></td> <td>vcolumns used in the partition.</td> </tr>
    <tr> <td><div class="param_name">return_trans</div></td> <td><div class="type">bool</div></td> <td><div class = "yes">&#10003;</div></td> <td>If set to True, the method will return the transformation used instead of the parent vDataFrame. This parameter is used for testing purposes.</td> </tr>
</table>

### Returns

<b>vDataFrame</b> : self.parent (or the transformation used, when return_trans is set to True)

### Example

In [75]:
# Load the Titanic example dataset and display the raw "age" vcolumn
# so it can be compared with the normalized outputs below.
from vertica_ml_python.learn.datasets import load_titanic
titanic = load_titanic()
print(titanic["age"])

0,1
,age
0.0,2.000
1.0,30.000
2.0,25.000
3.0,39.000
4.0,71.000
,...


<object>  Name: age, Number of rows: 1234, dtype: numeric(6,3)


In [71]:
# MINMAX: normalize "age" with (x - min) / (max - min)
titanic["age"].normalize(method = "minmax")

0,1
,age
0.0,0.0209614660474458237992154438868
1.0,0.3724111961842601243746117350614
2.0,0.3096523158026861368120729085676
3.0,0.4853771808710932126627182111777
4.0,0.8870340153131667628377878379292
,...


<object>  Name: age, Number of rows: 1234, dtype: float

In [74]:
# ZSCORE: normalize "age" with (x - avg) / std
titanic["age"].normalize(method = "zscore")

0,1
,age
0.0,-1.9502503129565278908367342155
1.0,-0.0105614239550127329564098413
2.0,-0.3569344398481404397207534796
3.0,0.6129100046526171392194087075
4.0,2.8296973063686344625112079923
,...


<object>  Name: age, Number of rows: 1234, dtype: float

In [76]:
# ZSCORE partitioned by pclass and survived: "by" lists the vcolumns
# used in the partition for the normalization.
titanic["age"].normalize(method = "zscore", 
                         by = ["pclass", "survived"])

0,1
,age
0.0,-2.87022036418951
1.0,-0.921130872070904
2.0,-1.26918256709208
3.0,-0.294637821032781
4.0,1.93289302710277
,...


<object>  Name: age, Number of rows: 1234, dtype: float

### See Also

<table id="seealso">
    <tr><td><a href="../../main-methods/outliers">vDataFrame.outliers</a></td> <td>Computes the vDataFrame Global Outliers.</td></tr>
</table>