In [1]:
import datasense as ds
import pandas as pd

In [2]:
# Demo frame with one column per dtype family: 'x' and 'z' are float samples,
# 'y' is an integer sample, and 't' is a datetime series.
df = pd.DataFrame(
    data={
        # The three numeric columns differ only in the distribution drawn from.
        **{
            label: ds.random_data(distribution=law)
            for label, law in (
                ('x', 'norm'),
                ('y', 'randint'),
                ('z', 'uniform'),
            )
        },
        't': ds.datetime_data(),
    }
)

In [3]:
# Confirm the frame's dimensions, reported as (rows, columns).
df.shape

(42, 4)

In [4]:
# Preview the first rows to sanity-check the generated values.
df.head()

Unnamed: 0,x,y,z,t
0,-0.098097,46,0.152227,2020-09-26 12:37:20
1,0.825161,51,0.439836,2020-09-27 12:37:20
2,-0.405795,55,0.079451,2020-09-28 12:37:20
3,1.159694,31,0.715497,2020-09-29 12:37:20
4,0.150529,34,0.820659,2020-09-30 12:37:20


In [5]:
# Inspect the dtype of every column (two float64, one int64, one datetime64
# column in this frame).
df.dtypes

x           float64
y             int64
z           float64
t    datetime64[ns]
dtype: object

In [6]:
# List the column labels in frame order.
df.columns

Index(['x', 'y', 'z', 't'], dtype='object')

In [7]:
# help() writes the documentation to stdout itself and returns None, so it is
# called bare; wrapping it in print() would append a stray "None" line.
help(ds.find_int_columns)

Help on function find_int_columns in module datasense.munging:

find_int_columns(df: pandas.core.frame.DataFrame) -> List[str]
    Find all integer columns in a dataframe.
    
    Parameters
    ----------
    df : pd.DataFrame
        The input dataframe.
    
    Returns
    -------
    columns_int : List[str]
        A list of integer column names.
    
    Example
    -------
    >>> import datasense as ds
    >>> import pandas as pd
    >>> df = pd.DataFrame(
    >>>     {
    >>>         'x': ds.random_data(distribution='norm'),
    >>>         'y': ds.random_data(distribution='randint'),
    >>>         'z': ds.random_data(distribution='uniform'),
    >>>         't': ds.datetime_data()
    >>>     }
    >>> )
    >>> columns_int = ds.find_int_columns(df=df)
    >>> print(columns_int)
    ['y']

None


In [8]:
# Collect the names of the integer columns with the datasense helper and show
# them; for this frame only 'y' qualifies.
columns_int = ds.find_int_columns(df=df)
print(columns_int)

['y']


In [9]:
# help() writes the documentation to stdout itself and returns None, so it is
# called bare; wrapping it in print() would append a stray "None" line.
help(ds.find_int_float_columns)

Help on function find_int_float_columns in module datasense.munging:

find_int_float_columns(df: pandas.core.frame.DataFrame) -> List[str]
    Find all integer and float columns in a dataframe.
    
    Parameters
    ----------
    df : pd.DataFrame
        The input dataframe.
    
    Returns
    -------
    columns_int_float : List[str]
        A list of integer and float column names.
    
    Example
    -------
    >>> import datasense as ds
    >>> import pandas as pd
    >>> df = pd.DataFrame(
    >>>     {
    >>>         'x': ds.random_data(distribution='norm'),
    >>>         'y': ds.random_data(distribution='randint'),
    >>>         'z': ds.random_data(distribution='uniform'),
    >>>         't': ds.datetime_data()
    >>>     }
    >>> )
    >>> columns_int_float = ds.find_int_float_columns(df=df)
    >>> print(columns_int_float)
    ['x', 'y', 'z']

None


In [10]:
# Collect the names of the integer and float columns with the datasense helper
# and show them; for this frame that is every column except the datetime 't'.
columns_int_float = ds.find_int_float_columns(df=df)
print(columns_int_float)

['x', 'y', 'z']


In [11]:
# Same selection done directly with pandas: keep the int64 columns and take
# their labels as a plain list. This rebinds columns_int.
columns_int = df.select_dtypes(include=['int64']).columns.tolist()

In [12]:
# Same selection done directly with pandas: keep the int64 and float64 columns
# and take their labels as a plain list. This rebinds columns_int_float.
columns_int_float = (
    df.select_dtypes(include=['int64', 'float64'])
    .columns
    .tolist()
)

In [13]:
# Show the select_dtypes-based result; here it matches the list produced by
# ds.find_int_columns.
print(columns_int)

['y']


In [14]:
# Show the select_dtypes-based result; here it matches the list produced by
# ds.find_int_float_columns.
print(columns_int_float)

['x', 'y', 'z']


In [15]:
# Print a summary report for the frame (row/column counts, per-column dtype
# and empty-cell statistics, column names grouped by type). `filein` is the
# label shown in the report header.
# NOTE(review): the report marks empty rows/columns as "(deleted)", so the
# returned frame presumably has them removed; df is rebound to it — confirm
# against the datasense documentation.
df = ds.dataframe_info(
    df=df,
    filein='test'
)

--------------------------
DataFrame information for: test

Rows total        : 42
Rows empty        : 0 (deleted)
Rows not empty    : 42
Columns total     : 4
Columns empty     : 0 (deleted)
Columns not empty : 4

Information about non-empty columns
 Column   Data type        Empty cell count   Empty cell percentage 
-------- ---------------- ------------------ -----------------------
 x        float64                         0                     0.0 
 y        int64                           0                     0.0 
 z        float64                         0                     0.0 
 t        datetime64[ns]                  0                     0.0 

List of 4 non-empty columns:
t, x, y, z

List of 2 float columns:
x, z

List of 1 integer columns:
y

List of 1 datetime columns:
t

List of 0 string columns:

List of 0 empty columns:

