### Vaex - Reading and Processing Huge Datasets in Seconds

### What is Vaex?
Vaex is a high performance Python library for lazy Out-of-Core DataFrames (similar to Pandas), to visualize and explore big tabular datasets. It calculates statistics such as mean, sum, count, standard deviation etc, on an N-dimensional grid for more than a billion (10^9) samples/rows per second. Visualization is done using histograms, density plots and 3d volume rendering, allowing interactive exploration of big data. Vaex uses memory mapping, zero memory copy policy and lazy computations for best performance (no memory wasted).

In [1]:
# Uncomment to install Vaex into the running kernel's environment
# (%pip targets the kernel's interpreter, unlike a bare shell pip).
# %pip install vaex

In [2]:
import vaex
import pandas as pd
import numpy as np


In [3]:
# Small preview: a 2x5 array of random integers drawn from [0, 100)
# (the upper bound is exclusive).
np.random.randint(0, 100, size=(2, 5))

array([[18, 45,  5, 80, 37],
       [13, 39, 13, 93, 55]])

In [4]:
# Build a synthetic, wide dataset: n_rows x n_cols random integers in [0, 100).
# A seeded Generator makes the data reproducible under Restart & Run All, and the
# explicit int32 dtype keeps the footprint at roughly 2 GB on every platform
# (the platform-default integer is 8 bytes wide on most Linux/macOS builds).

SEED = 42
n_rows = 1000000
n_cols = 500

rng = np.random.default_rng(SEED)
df = pd.DataFrame(
    rng.integers(0, 100, size=(n_rows, n_cols), dtype=np.int32),
    columns=[f'col{i}' for i in range(n_cols)],
)
df.head()

Unnamed: 0,col0,col1,col2,col3,col4,col5,col6,col7,col8,col9,...,col490,col491,col492,col493,col494,col495,col496,col497,col498,col499
0,98,10,87,81,97,91,31,70,42,30,...,57,10,88,16,66,41,12,50,49,15
1,67,96,52,66,29,12,77,96,28,41,...,6,89,94,79,16,96,86,59,88,28
2,29,57,98,15,60,80,71,89,63,26,...,41,61,32,91,62,27,43,14,59,80
3,18,62,81,94,11,35,54,97,0,27,...,17,25,50,21,94,32,86,24,8,11
4,22,14,13,3,24,3,47,89,2,15,...,27,73,60,45,7,22,52,56,87,65


In [5]:
# Summarise the frame: index range, column count, dtypes and total memory.
# memory_usage='deep' asks pandas for a full memory measurement rather than an estimate.
df.info(memory_usage='deep')

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 1000000 entries, 0 to 999999
Columns: 500 entries, col0 to col499
dtypes: int32(500)
memory usage: 1.9 GB


### Creating CSV files

In [6]:

# Write the synthetic frame to disk as CSV; index=False leaves the row index
# out of the file. file_path is reused by the loading cells further down.
file_path = 'final_data.csv'
df.to_csv(file_path, index=False)

### Create HDF5 files: HDF (Hierarchical Data Format) is a set of file formats (HDF4, HDF5) designed to store and organize large amounts of data.

In [7]:
%%time

# convert=True has vaex convert the CSV to HDF5 and return a DataFrame backed by
# that file (it is re-opened later as 'final_data.csv.hdf5').
# chunk_size (5,000,000) is larger than n_rows, so presumably the CSV is read as one chunk.
# NOTE(review): the recorded sub-second wall time presumably reflects an already
# converted file being reused - confirm by timing against a freshly written CSV.
vaex_df = vaex.from_csv(file_path, convert=True, chunk_size=5_000_000)

Wall time: 399 ms


In [8]:
%%time
# Baseline: load the same CSV with pandas to compare against the vaex load.

pd_df = pd.read_csv(file_path)

# Per the recorded wall times, pandas was far slower here (~40 s vs. ~0.4 s for vaex).

Wall time: 39.7 s


In [9]:
# Check which class vaex returned for the converted dataset.
type(vaex_df)

vaex.hdf5.dataset.Hdf5MemoryMapped

### Read HDF5 files using the Vaex library

In [10]:
# Re-open the HDF5 file directly (path is file_path + '.hdf5'); presumably this is
# the file written by the convert=True call, so the CSV need not be parsed again.
vaex_df = vaex.open('final_data.csv.hdf5')

In [11]:
# Confirm that vaex.open yields the same dataset class as the CSV conversion did.
type(vaex_df)

vaex.hdf5.dataset.Hdf5MemoryMapped

In [12]:
# Show the first rows; all 500 columns are rendered, so the output is very wide.
vaex_df.head()

#,col0,col1,col2,col3,col4,col5,col6,col7,col8,col9,col10,col11,col12,col13,col14,col15,col16,col17,col18,col19,col20,col21,col22,col23,col24,col25,col26,col27,col28,col29,col30,col31,col32,col33,col34,col35,col36,col37,col38,col39,col40,col41,col42,col43,col44,col45,col46,col47,col48,col49,col50,col51,col52,col53,col54,col55,col56,col57,col58,col59,col60,col61,col62,col63,col64,col65,col66,col67,col68,col69,col70,col71,col72,col73,col74,col75,col76,col77,col78,col79,col80,col81,col82,col83,col84,col85,col86,col87,col88,col89,col90,col91,col92,col93,col94,col95,col96,col97,col98,col99,col100,col101,col102,col103,col104,col105,col106,col107,col108,col109,col110,col111,col112,col113,col114,col115,col116,col117,col118,col119,col120,col121,col122,col123,col124,col125,col126,col127,col128,col129,col130,col131,col132,col133,col134,col135,col136,col137,col138,col139,col140,col141,col142,col143,col144,col145,col146,col147,col148,col149,col150,col151,col152,col153,col154,col155,col156,col157,col158,col159,col160,col161,col162,col163,col164,col165,col166,col167,col168,col169,col170,col171,col172,col173,col174,col175,col176,col177,col178,col179,col180,col181,col182,col183,col184,col185,col186,col187,col188,col189,col190,col191,col192,col193,col194,col195,col196,col197,col198,col199,col200,col201,col202,col203,col204,col205,col206,col207,col208,col209,col210,col211,col212,col213,col214,col215,col216,col217,col218,col219,col220,col221,col222,col223,col224,col225,col226,col227,col228,col229,col230,col231,col232,col233,col234,col235,col236,col237,col238,col239,col240,col241,col242,col243,col244,col245,col246,col247,col248,col249,col250,col251,col252,col253,col254,col255,col256,col257,col258,col259,col260,col261,col262,col263,col264,col265,col266,col267,col268,col269,col270,col271,col272,col273,col274,col275,col276,col277,col278,col279,col280,col281,col282,col283,col284,col285,col286,col287,col288,col289,col290,col291,col292,col293,col294,col295,col296,col297,col298,col299,col300,c
ol301,col302,col303,col304,col305,col306,col307,col308,col309,col310,col311,col312,col313,col314,col315,col316,col317,col318,col319,col320,col321,col322,col323,col324,col325,col326,col327,col328,col329,col330,col331,col332,col333,col334,col335,col336,col337,col338,col339,col340,col341,col342,col343,col344,col345,col346,col347,col348,col349,col350,col351,col352,col353,col354,col355,col356,col357,col358,col359,col360,col361,col362,col363,col364,col365,col366,col367,col368,col369,col370,col371,col372,col373,col374,col375,col376,col377,col378,col379,col380,col381,col382,col383,col384,col385,col386,col387,col388,col389,col390,col391,col392,col393,col394,col395,col396,col397,col398,col399,col400,col401,col402,col403,col404,col405,col406,col407,col408,col409,col410,col411,col412,col413,col414,col415,col416,col417,col418,col419,col420,col421,col422,col423,col424,col425,col426,col427,col428,col429,col430,col431,col432,col433,col434,col435,col436,col437,col438,col439,col440,col441,col442,col443,col444,col445,col446,col447,col448,col449,col450,col451,col452,col453,col454,col455,col456,col457,col458,col459,col460,col461,col462,col463,col464,col465,col466,col467,col468,col469,col470,col471,col472,col473,col474,col475,col476,col477,col478,col479,col480,col481,col482,col483,col484,col485,col486,col487,col488,col489,col490,col491,col492,col493,col494,col495,col496,col497,col498,col499
0,97,6,48,80,3,59,19,18,68,26,13,92,89,23,94,69,14,11,79,10,7,71,83,46,67,98,27,80,64,38,0,18,15,17,12,29,92,57,61,39,55,67,32,95,81,76,52,79,2,57,9,29,2,13,66,46,92,48,32,61,43,97,73,45,83,52,44,77,30,72,55,7,43,21,50,70,79,73,76,56,81,33,21,27,14,73,92,55,1,93,80,20,94,32,81,51,18,25,85,14,50,48,92,46,21,19,31,6,35,3,30,10,88,61,20,39,49,30,34,94,59,27,70,35,8,83,61,53,94,67,80,89,82,16,7,49,44,26,10,34,19,39,89,63,81,69,40,6,9,21,82,69,29,98,56,95,63,77,27,96,14,43,73,14,63,24,8,54,21,66,95,34,3,30,50,89,32,0,29,40,78,53,47,87,90,89,76,6,96,2,4,81,29,9,82,3,27,78,60,37,36,53,55,61,81,2,55,94,77,65,54,60,45,12,46,13,27,55,45,95,65,52,77,56,18,9,8,94,99,31,76,10,90,47,40,99,82,13,61,18,77,77,82,11,77,93,64,9,5,15,97,97,18,18,89,65,5,64,66,72,35,31,70,87,4,5,22,11,88,58,18,38,7,44,18,77,4,37,83,54,27,70,82,22,81,24,91,69,27,51,5,37,65,53,48,12,49,92,73,89,89,88,87,14,75,66,90,39,43,49,9,11,20,25,38,75,90,79,17,53,47,69,62,70,87,79,3,63,38,12,62,18,47,44,63,34,15,59,95,19,39,25,19,83,50,40,7,45,16,76,79,81,22,33,52,91,17,48,53,87,67,66,33,20,49,67,74,49,88,4,26,1,75,96,99,11,61,16,97,82,81,10,27,78,78,0,74,3,32,18,39,44,52,39,25,79,33,45,2,14,24,37,74,32,87,26,1,67,78,5,94,1,7,19,62,3,93,97,78,63,4,44,56,77,55,27,58,13,65,71,26,24,11,36,58,77,13,42,59,67,89,1,16,20,72,77,18,70,79,42,94,11,40,56,47,25,45,64,83,23,88,36,95,5,66,38,61,80,36,42,20,16,56,63,15,79,90,85,95,61,55,53,72,64,1,22,84,58,62,37,87,33,36,27,39,32,1,34,31,1
1,8,24,31,36,55,97,99,77,76,21,85,0,26,97,60,59,84,99,7,10,40,76,35,59,40,81,49,98,53,54,68,42,46,49,55,78,60,48,19,41,53,82,78,24,12,51,89,76,10,93,90,12,54,63,51,74,27,30,88,97,83,80,46,27,7,68,80,27,1,36,9,21,99,46,5,94,54,13,94,56,91,69,70,26,2,43,56,20,46,3,76,68,30,9,81,92,17,15,48,73,64,85,89,53,31,47,8,86,43,88,74,58,47,96,99,17,16,77,9,53,89,48,41,22,89,89,48,5,44,89,59,86,61,29,55,27,35,24,3,65,73,18,32,18,73,71,56,24,16,61,62,53,20,28,58,92,79,71,99,95,80,10,3,74,30,5,36,14,53,81,67,33,48,87,9,45,40,70,18,68,70,89,73,39,14,62,49,61,74,5,80,13,60,43,92,27,70,89,74,43,39,66,28,94,27,21,62,36,79,89,89,61,48,73,82,55,60,32,48,90,92,35,81,58,33,22,28,80,24,86,7,80,41,38,68,72,1,69,54,56,73,47,62,40,40,22,76,42,79,83,26,94,19,3,67,42,24,20,40,10,5,35,40,28,80,57,85,96,55,67,89,63,2,10,31,70,1,10,20,27,56,71,50,67,21,67,10,34,39,83,54,59,82,11,29,33,80,98,40,0,91,11,72,52,71,6,31,14,17,31,40,88,22,29,79,11,42,41,95,21,75,78,40,63,59,34,72,14,55,81,62,26,55,83,4,90,70,27,14,53,90,93,8,80,93,74,54,89,84,68,51,71,80,79,82,70,89,74,61,46,95,49,38,48,29,31,7,26,86,38,76,74,75,13,24,48,97,51,79,73,20,32,77,28,77,43,17,23,65,86,70,25,60,64,88,34,27,12,89,71,25,99,44,75,62,82,16,80,54,27,9,13,33,60,16,84,91,29,38,19,36,50,16,71,99,93,97,86,5,19,55,20,19,15,77,52,86,69,86,17,90,1,88,21,87,66,59,23,12,98,65,52,48,72,92,37,26,95,83,23,52,29,47,58,55,75,28,0,9,65,59,18,9,61,89,33,75,49,14,58,32,81,1,73,61,91,58,36,67,75,41,6,43,32,66,83,34,57,22,79
2,36,78,24,15,78,69,72,7,96,31,18,40,14,3,7,85,40,48,57,69,77,35,47,64,12,51,50,5,73,85,48,7,72,4,96,42,47,83,43,38,45,76,30,42,7,21,34,85,50,72,8,90,80,33,52,42,31,86,91,3,21,90,68,64,51,52,75,98,60,3,33,11,57,27,88,55,95,15,35,6,40,91,25,36,54,45,59,70,68,50,32,7,3,83,87,9,40,32,35,99,23,21,83,12,35,86,49,81,70,96,22,97,74,85,45,5,77,61,38,38,81,97,15,62,25,10,30,32,75,82,27,83,26,92,13,91,23,58,20,63,17,49,69,95,96,51,54,49,2,83,45,76,20,33,75,45,11,80,87,29,99,55,51,39,8,31,87,90,88,46,79,13,81,1,43,58,1,91,23,1,75,67,76,53,4,34,19,71,6,40,86,24,98,29,49,34,80,42,26,30,71,90,37,84,49,78,6,53,27,78,28,71,55,34,27,71,55,88,52,87,97,63,50,88,39,5,96,73,20,33,84,61,9,93,70,68,74,56,88,76,52,21,91,80,17,20,20,39,66,50,86,19,26,34,91,79,38,47,45,24,80,97,47,10,21,68,25,39,93,91,76,55,85,27,90,3,39,74,78,61,40,0,56,64,46,20,22,24,78,82,24,18,41,11,58,63,99,65,63,91,50,94,92,96,62,73,25,37,20,2,55,31,43,15,71,89,65,60,64,54,24,1,84,15,65,51,49,25,12,82,59,92,75,56,37,58,8,37,92,42,90,6,2,72,62,56,25,86,60,77,68,91,57,36,78,76,60,70,62,79,13,97,5,88,88,0,90,66,15,5,43,26,63,29,73,64,64,49,70,61,32,67,25,0,17,71,42,80,98,26,67,0,64,34,73,83,68,46,99,51,31,87,51,68,47,6,1,98,28,82,60,31,88,69,44,42,14,70,54,86,27,91,49,49,25,86,34,50,90,36,92,4,39,17,49,2,21,52,56,51,96,29,83,59,91,18,99,15,44,88,56,26,92,57,30,36,73,92,75,53,38,24,83,2,1,83,15,44,96,10,8,84,15,47,70,46,82,88,41,32,89,42,29,21,87,17,60,82,16,29,96,73,61,13,33,28,79,51,90,20
3,15,54,61,33,4,55,89,38,89,74,62,38,3,89,76,51,48,13,92,33,84,2,31,27,43,23,67,7,32,25,71,29,12,63,38,39,45,33,31,11,88,68,99,47,40,27,51,60,31,91,62,93,87,73,45,81,58,54,47,53,21,36,27,58,57,39,45,88,61,66,16,35,41,5,33,9,64,57,59,41,63,71,11,24,63,60,47,19,27,65,71,54,18,57,6,36,50,63,91,3,53,77,7,47,20,92,33,57,67,59,15,74,69,53,75,50,15,56,27,10,92,20,31,3,89,36,77,53,62,78,15,65,78,73,64,19,84,21,80,29,94,33,72,88,67,45,45,58,61,74,97,54,39,52,52,97,93,93,82,37,11,22,14,56,20,32,98,10,37,77,30,29,19,95,89,36,22,64,91,55,5,39,97,46,21,6,3,9,23,6,66,31,72,36,1,99,10,24,83,67,65,82,98,46,14,0,67,32,66,9,66,69,58,41,94,30,43,10,31,5,26,8,86,93,12,12,81,55,16,4,54,7,82,11,73,16,70,48,35,45,61,58,62,64,23,33,9,62,17,89,70,78,31,78,3,37,3,29,16,0,17,33,78,60,72,73,50,76,97,17,27,37,19,51,45,4,7,67,35,92,50,71,3,97,23,89,30,94,35,13,5,30,56,60,52,32,95,24,12,23,67,58,34,7,63,89,64,43,89,84,44,98,2,58,69,42,30,67,3,70,76,24,29,31,35,7,80,81,53,74,7,98,92,56,75,52,64,51,73,13,87,21,71,80,52,6,6,91,14,0,33,14,63,36,70,89,48,97,21,28,83,69,38,57,88,4,78,42,8,87,25,21,81,28,15,8,99,42,14,32,84,52,80,91,64,77,19,96,96,1,74,37,36,41,25,63,56,1,75,91,97,99,33,59,37,3,70,89,58,83,0,98,75,80,48,39,7,65,31,92,9,93,24,67,36,62,55,17,68,50,47,33,69,63,34,95,4,78,46,13,68,56,83,4,2,46,25,6,30,38,10,76,21,11,40,73,47,71,9,20,22,81,39,61,78,66,55,22,68,59,35,66,42,43,87,80,67,54,7,79,43,46,40,42,59,0,13,90,62,81,5,67,78,75,3,0,36,14,24,61
4,15,57,73,53,67,56,67,67,20,47,57,56,18,81,94,6,76,37,69,69,61,1,30,97,3,85,64,79,58,67,13,14,25,27,76,6,76,90,34,14,69,88,4,10,42,23,49,92,17,35,81,86,8,34,84,60,26,54,20,65,90,68,56,55,91,3,60,40,63,47,47,82,21,82,57,6,74,56,40,1,14,81,98,29,25,31,4,9,82,75,45,45,30,57,33,17,59,29,11,25,0,2,19,5,12,31,48,33,65,80,53,17,12,31,48,36,38,88,65,15,70,19,41,29,66,5,39,21,82,94,89,75,82,31,45,52,29,83,49,77,33,36,52,3,88,55,51,0,6,69,81,57,71,88,5,98,87,26,83,48,8,78,74,72,10,93,45,84,87,95,7,86,14,10,82,46,30,3,78,97,78,7,34,61,20,98,22,26,44,44,58,93,33,29,42,45,8,3,65,68,74,70,52,77,86,44,17,15,61,30,19,9,56,30,64,64,91,4,76,70,78,39,43,91,81,72,26,44,42,76,46,45,61,28,7,6,58,72,36,80,42,55,90,0,48,61,5,91,51,43,72,55,44,37,0,1,90,9,6,81,29,0,81,40,30,18,25,54,25,88,16,86,43,49,8,79,1,77,45,92,25,32,66,48,67,48,73,57,78,95,9,77,89,10,52,76,42,56,58,79,45,18,9,51,42,86,14,37,38,30,18,74,29,77,82,35,64,15,28,47,64,25,53,80,84,14,90,6,74,67,57,79,83,37,99,10,5,85,43,78,94,72,2,26,16,14,63,73,11,56,31,38,37,48,94,51,26,95,66,77,66,91,58,43,56,17,89,79,56,3,75,51,74,49,4,59,62,39,42,26,37,29,69,24,7,2,9,32,6,38,92,0,47,92,39,76,17,12,10,92,93,4,93,96,54,83,87,90,65,26,32,47,33,59,85,16,41,5,58,49,18,43,28,94,16,31,86,42,72,63,70,35,13,61,52,81,7,57,1,53,69,52,47,4,50,2,46,94,47,32,87,63,71,86,71,36,29,52,68,50,28,99,37,85,82,76,49,83,40,22,58,18,12,28,48,70,23,54,33,15,71,38,32,39,60,91,56,94,53,84,98,50,16,97,4,15,25,22,75,93
5,55,90,23,39,8,9,62,90,23,59,0,61,9,28,40,75,7,74,70,34,41,34,43,61,78,87,82,70,16,12,37,14,60,88,2,54,88,85,11,67,36,15,22,68,55,1,97,23,68,43,61,34,3,41,69,57,77,83,79,68,44,18,85,11,83,52,46,78,94,70,67,6,21,83,39,36,97,12,96,38,84,0,13,16,64,77,14,86,53,24,92,52,81,12,81,77,95,51,81,88,55,40,14,31,38,69,66,43,10,93,12,44,34,29,10,13,83,38,13,27,85,2,60,4,88,61,63,25,45,1,33,4,30,52,86,33,34,24,14,87,27,26,6,65,99,10,63,56,72,68,82,77,72,60,62,3,83,87,38,65,30,32,9,93,96,14,31,92,15,56,38,11,2,58,76,57,24,25,81,78,87,73,17,42,44,8,75,75,45,62,6,34,15,76,60,99,80,55,33,93,51,18,4,26,4,34,69,74,3,93,83,78,5,37,11,76,1,69,49,16,40,13,5,66,27,29,24,9,58,74,22,17,85,92,61,84,91,9,99,1,20,80,23,70,1,20,28,28,11,92,89,17,79,41,97,13,66,79,24,88,28,84,55,2,84,14,33,83,47,1,62,49,2,56,83,26,27,30,45,6,33,17,45,59,21,58,62,33,51,57,98,38,41,2,82,95,47,25,70,20,7,51,46,17,65,10,68,98,68,26,22,6,43,79,83,22,74,7,43,75,27,34,65,17,51,33,39,31,3,44,38,16,38,61,61,1,36,76,44,13,4,53,77,26,47,23,5,67,98,36,67,93,21,72,87,0,10,99,83,18,5,86,8,36,4,89,74,62,45,96,93,57,26,49,44,82,53,59,65,7,72,90,67,82,44,65,78,81,63,43,20,61,78,25,63,33,66,28,85,0,46,59,39,12,93,3,75,77,52,26,15,64,50,62,75,17,31,59,12,88,7,1,10,45,2,40,44,56,60,41,49,72,97,25,51,82,38,73,74,12,68,2,54,63,88,98,93,3,5,12,21,74,0,69,1,91,0,82,61,83,9,12,54,6,82,20,63,79,6,20,68,32,35,41,72,15,75,49,84,44,98,68,31,40,78,12,46,82,55,98,57,82,95,77,58,14,13,87,45,90
6,48,26,10,98,17,48,29,92,78,9,50,96,42,39,0,19,71,28,90,41,90,31,28,90,70,71,43,95,99,67,57,47,57,11,94,44,36,54,59,35,67,80,25,5,81,82,55,91,41,23,96,95,97,48,83,1,4,70,93,70,34,4,66,16,66,80,67,10,46,96,5,37,79,98,19,16,8,89,74,81,21,64,74,27,57,41,24,23,25,29,55,49,77,70,70,2,41,94,17,0,35,48,73,1,27,48,39,67,72,43,38,32,40,25,89,64,40,7,57,37,61,50,83,46,43,67,28,2,36,31,34,96,3,55,11,13,44,24,10,50,7,60,83,90,98,8,98,54,2,86,23,80,97,76,98,15,93,31,76,61,4,31,48,50,8,65,26,48,98,47,68,9,40,61,25,46,88,96,29,72,70,59,71,15,25,78,60,8,61,19,38,19,25,99,11,68,98,40,30,19,40,21,32,26,20,9,34,51,60,70,82,57,94,1,46,97,74,97,41,70,55,37,4,67,26,79,62,72,77,64,19,55,88,88,47,28,60,96,44,49,97,67,49,23,20,84,83,70,98,71,41,83,78,32,8,91,55,5,91,4,92,50,44,86,30,98,23,25,13,53,81,7,51,89,22,52,31,22,78,96,51,64,61,80,92,96,2,33,16,89,74,97,42,80,29,75,11,91,52,19,72,8,7,33,56,8,20,77,71,81,97,22,85,62,46,56,19,93,11,33,84,61,39,34,4,80,91,10,37,75,59,26,69,39,23,41,0,3,60,4,24,37,84,84,90,23,66,70,14,31,40,13,80,25,12,54,57,97,61,28,70,93,40,67,93,77,89,57,92,50,94,1,29,30,14,7,22,73,74,28,99,30,26,64,96,30,82,33,12,73,15,92,69,19,93,36,51,14,17,3,78,8,83,68,15,59,37,85,26,22,3,82,21,44,15,6,64,20,75,48,0,25,70,54,71,98,95,54,67,98,98,79,89,72,61,47,53,19,62,32,53,77,60,11,20,4,5,67,92,40,33,1,42,27,46,62,0,31,3,61,32,57,75,95,30,65,95,18,90,55,43,61,91,27,94,60,7,8,48,7,70,90,82,90,4,73,73,98,72,93,41,82,47,89,68,15,51,38,64,94
7,61,41,92,10,76,10,57,46,56,1,99,66,66,19,2,57,39,13,64,68,45,60,73,64,49,36,8,62,5,70,90,24,88,9,26,41,41,13,38,62,69,92,77,27,78,32,2,96,2,49,97,31,96,48,11,61,78,39,13,54,28,52,85,35,59,20,83,69,65,97,60,54,48,25,66,75,65,83,37,85,2,2,85,27,15,12,13,49,59,53,37,16,46,83,29,12,17,81,23,16,80,16,65,85,85,3,25,68,70,48,14,18,99,68,88,10,38,67,49,55,26,75,36,60,47,74,91,6,86,4,91,97,41,9,30,78,15,48,83,42,38,86,96,74,78,74,98,76,55,57,20,48,80,65,38,35,0,92,13,46,49,91,53,73,23,49,90,15,30,49,5,37,61,57,82,87,17,82,45,54,30,45,45,80,69,27,10,29,24,26,74,5,23,21,11,68,75,75,57,17,41,41,70,55,65,88,93,56,7,81,50,87,21,20,64,41,16,31,30,57,19,62,45,71,23,39,43,37,4,63,98,74,58,77,4,19,96,45,4,90,40,76,31,36,17,70,56,59,85,41,23,73,17,78,23,36,25,99,72,17,40,7,13,27,77,55,13,81,72,5,43,65,89,85,17,31,29,1,11,76,62,48,75,21,42,48,5,12,29,25,76,41,92,69,59,0,5,90,79,10,82,68,24,2,54,33,22,32,92,93,6,85,85,76,73,68,96,54,30,96,45,4,90,69,3,96,16,2,46,59,13,47,10,8,70,42,65,21,74,17,61,6,12,29,16,38,38,39,86,5,6,85,74,38,98,11,62,24,3,34,35,31,71,51,95,43,71,93,52,49,3,43,92,50,64,44,92,95,91,86,90,30,40,64,59,37,6,39,51,99,87,54,37,45,87,42,94,77,52,26,14,42,31,62,64,55,52,0,77,96,66,39,78,72,67,87,56,68,57,64,5,19,42,19,38,76,66,88,67,80,94,69,5,45,33,26,85,2,3,19,62,55,50,58,43,68,79,90,9,5,42,94,94,2,70,93,66,31,52,79,76,0,62,42,8,53,73,45,87,14,51,26,62,50,71,44,90,2,3,50,94,27,56,63,11,25,3,82,58,70,73,27,96,29,94,53,42,53,80,51
8,34,44,55,15,1,29,20,21,29,18,6,85,64,71,16,42,74,22,13,19,50,19,83,9,15,26,99,99,13,20,36,91,84,81,55,24,30,93,15,60,34,28,23,82,89,84,28,51,95,50,72,99,25,50,18,39,56,58,49,46,9,44,89,69,17,0,82,31,9,84,29,56,40,42,53,51,96,67,39,6,59,54,93,38,43,11,11,32,73,48,23,85,93,43,8,38,50,12,61,60,85,40,51,22,44,6,78,65,13,14,85,58,8,51,73,74,46,52,37,87,3,70,78,91,7,4,7,58,17,96,9,89,70,3,50,28,60,56,61,80,89,41,56,98,47,68,45,15,13,93,20,66,30,89,20,34,80,97,45,55,10,20,56,66,43,90,78,13,73,35,49,87,75,47,24,8,61,31,39,60,82,59,17,87,37,23,65,17,83,3,1,77,20,23,18,77,36,51,36,93,53,82,76,1,24,67,89,98,74,11,37,11,69,48,70,10,20,49,34,60,74,34,10,88,30,25,33,95,74,91,59,80,29,96,26,62,92,67,72,44,92,42,74,49,44,7,44,27,48,96,68,27,62,30,60,0,53,87,8,96,35,79,65,88,81,4,43,84,30,45,49,39,88,60,52,26,85,39,54,80,25,58,51,89,34,80,21,74,74,99,67,42,73,5,70,22,81,84,96,11,48,7,54,46,53,34,99,11,71,81,5,75,65,46,47,42,14,29,62,59,16,6,39,91,13,79,31,89,84,91,10,49,34,58,9,78,39,15,71,43,74,15,95,77,2,13,65,15,0,71,52,91,29,20,33,9,39,84,39,84,58,3,48,71,83,93,0,19,26,15,9,10,36,77,66,45,78,25,61,95,71,53,85,89,10,44,9,33,90,39,3,69,84,23,69,47,59,78,42,35,1,49,35,32,25,36,12,7,16,63,53,99,82,36,99,19,99,65,65,2,60,79,70,24,92,54,28,68,90,54,68,87,28,79,74,16,14,60,9,10,96,77,98,9,45,51,13,71,79,1,3,30,43,32,62,67,66,56,33,26,91,27,36,80,55,22,5,27,77,58,76,46,91,67,43,73,31,52,92,88,99,56,8,8,68,8,40,83,66,92,7,64,7,74,13,49,47,58,26,94
9,65,31,58,50,35,67,93,7,5,70,92,97,15,59,25,18,24,53,28,42,70,90,7,45,81,25,10,73,96,77,4,9,53,30,42,69,16,60,59,95,16,31,71,99,80,93,11,17,52,72,86,48,14,50,9,78,34,76,52,87,60,49,96,38,85,72,95,38,23,88,76,91,49,52,6,76,85,29,79,71,25,72,69,80,66,47,62,78,49,16,80,10,97,92,66,36,46,85,18,78,28,11,43,86,29,86,69,5,18,2,99,6,84,31,21,52,34,58,76,66,64,12,51,89,6,68,22,93,97,63,54,33,48,72,86,28,16,63,20,91,80,21,35,68,40,56,33,22,32,10,61,63,60,55,30,50,85,87,82,36,39,90,87,83,94,77,37,57,66,73,60,19,40,88,1,2,61,88,56,31,55,55,43,25,8,0,7,29,78,16,51,5,29,46,70,22,4,46,25,31,8,28,48,80,85,20,87,42,91,70,79,80,22,47,70,3,12,76,23,30,66,89,63,89,85,32,88,11,26,51,66,2,0,11,62,76,44,95,9,52,5,62,60,86,17,59,33,15,3,14,8,65,88,69,27,72,94,47,93,35,55,51,68,47,71,28,60,48,98,13,55,35,64,75,32,67,4,33,95,1,84,51,43,72,73,72,50,48,37,55,23,45,53,68,99,71,57,3,88,15,37,69,55,0,30,19,69,24,71,36,82,15,35,95,61,56,67,40,64,68,31,15,83,99,84,74,75,81,39,53,11,60,26,74,82,77,60,16,84,48,33,37,83,23,97,91,52,26,84,92,98,83,14,1,61,24,16,26,91,14,63,19,43,61,82,72,93,5,62,84,47,18,12,89,41,1,52,77,90,14,30,48,89,7,36,55,61,42,27,91,31,40,34,36,41,88,17,14,78,6,49,37,1,48,88,22,51,36,72,64,62,44,77,8,97,45,30,95,94,24,81,43,47,54,8,25,43,98,64,75,80,74,25,34,73,59,9,4,70,28,14,63,67,96,79,84,61,84,66,3,72,73,77,35,50,36,33,7,64,31,43,90,6,40,44,73,48,45,37,99,73,13,49,66,24,37,30,95,14,35,27,13,53,58,75,80,94,50,16,55,62,43,8,44,89,38,67,73,52,83


### Expression system
Don't waste memory or time with feature engineering: we (lazily) transform your data when needed.

In [13]:
%%time
vaex_df['multiplication_col13']=vaex_df.col1*vaex_df.col3

Wall time: 0 ns


In [14]:
%%time
pd_df['multiplication_col13']=pd_df.col1*pd_df.col3

# pandas is slower

Wall time: 28 ms


In [15]:
# Display the new column as a vaex Expression; only the first and last rows are printed.
vaex_df['multiplication_col13']

Expression = multiplication_col13
Length: 1,000,000 dtype: int64 (column)
---------------------------------------
     0   480
     1   864
     2  1170
     3  1782
     4  3021
    ...     
999995   444
999996   585
999997  2324
999998   142
999999  7047

### Out-of-core DataFrame
Filtering and evaluating expressions will not waste memory by making copies; the data is kept untouched on disk, and will be streamed only when needed. Delay the time before you need a cluster.

In [16]:
%%time
# Keep rows where col2 > 70; per the section text, vaex filters without copying the data.
vaex_df[vaex_df.col2>70]

Wall time: 97 ms


#,col0,col1,col2,col3,col4,col5,col6,col7,col8,col9,col10,col11,col12,col13,col14,col15,col16,col17,col18,col19,col20,col21,col22,col23,col24,col25,col26,col27,col28,col29,col30,col31,col32,col33,col34,col35,col36,col37,col38,col39,col40,col41,col42,col43,col44,col45,col46,col47,col48,col49,col50,col51,col52,col53,col54,col55,col56,col57,col58,col59,col60,col61,col62,col63,col64,col65,col66,col67,col68,col69,col70,col71,col72,col73,col74,col75,col76,col77,col78,col79,col80,col81,col82,col83,col84,col85,col86,col87,col88,col89,col90,col91,col92,col93,col94,col95,col96,col97,col98,col99,col100,col101,col102,col103,col104,col105,col106,col107,col108,col109,col110,col111,col112,col113,col114,col115,col116,col117,col118,col119,col120,col121,col122,col123,col124,col125,col126,col127,col128,col129,col130,col131,col132,col133,col134,col135,col136,col137,col138,col139,col140,col141,col142,col143,col144,col145,col146,col147,col148,col149,col150,col151,col152,col153,col154,col155,col156,col157,col158,col159,col160,col161,col162,col163,col164,col165,col166,col167,col168,col169,col170,col171,col172,col173,col174,col175,col176,col177,col178,col179,col180,col181,col182,col183,col184,col185,col186,col187,col188,col189,col190,col191,col192,col193,col194,col195,col196,col197,col198,col199,col200,col201,col202,col203,col204,col205,col206,col207,col208,col209,col210,col211,col212,col213,col214,col215,col216,col217,col218,col219,col220,col221,col222,col223,col224,col225,col226,col227,col228,col229,col230,col231,col232,col233,col234,col235,col236,col237,col238,col239,col240,col241,col242,col243,col244,col245,col246,col247,col248,col249,col250,col251,col252,col253,col254,col255,col256,col257,col258,col259,col260,col261,col262,col263,col264,col265,col266,col267,col268,col269,col270,col271,col272,col273,col274,col275,col276,col277,col278,col279,col280,col281,col282,col283,col284,col285,col286,col287,col288,col289,col290,col291,col292,col293,col294,col295,col296,col297,col298,col299,col300,c
ol301,col302,col303,col304,col305,col306,col307,col308,col309,col310,col311,col312,col313,col314,col315,col316,col317,col318,col319,col320,col321,col322,col323,col324,col325,col326,col327,col328,col329,col330,col331,col332,col333,col334,col335,col336,col337,col338,col339,col340,col341,col342,col343,col344,col345,col346,col347,col348,col349,col350,col351,col352,col353,col354,col355,col356,col357,col358,col359,col360,col361,col362,col363,col364,col365,col366,col367,col368,col369,col370,col371,col372,col373,col374,col375,col376,col377,col378,col379,col380,col381,col382,col383,col384,col385,col386,col387,col388,col389,col390,col391,col392,col393,col394,col395,col396,col397,col398,col399,col400,col401,col402,col403,col404,col405,col406,col407,col408,col409,col410,col411,col412,col413,col414,col415,col416,col417,col418,col419,col420,col421,col422,col423,col424,col425,col426,col427,col428,col429,col430,col431,col432,col433,col434,col435,col436,col437,col438,col439,col440,col441,col442,col443,col444,col445,col446,col447,col448,col449,col450,col451,col452,col453,col454,col455,col456,col457,col458,col459,col460,col461,col462,col463,col464,col465,col466,col467,col468,col469,col470,col471,col472,col473,col474,col475,col476,col477,col478,col479,col480,col481,col482,col483,col484,col485,col486,col487,col488,col489,col490,col491,col492,col493,col494,col495,col496,col497,col498,col499,multiplication_col13
0,15,57,73,53,67,56,67,67,20,47,57,56,18,81,94,6,76,37,69,69,61,1,30,97,3,85,64,79,58,67,13,14,25,27,76,6,76,90,34,14,69,88,4,10,42,23,49,92,17,35,81,86,8,34,84,60,26,54,20,65,90,68,56,55,91,3,60,40,63,47,47,82,21,82,57,6,74,56,40,1,14,81,98,29,25,31,4,9,82,75,45,45,30,57,33,17,59,29,11,25,0,2,19,5,12,31,48,33,65,80,53,17,12,31,48,36,38,88,65,15,70,19,41,29,66,5,39,21,82,94,89,75,82,31,45,52,29,83,49,77,33,36,52,3,88,55,51,0,6,69,81,57,71,88,5,98,87,26,83,48,8,78,74,72,10,93,45,84,87,95,7,86,14,10,82,46,30,3,78,97,78,7,34,61,20,98,22,26,44,44,58,93,33,29,42,45,8,3,65,68,74,70,52,77,86,44,17,15,61,30,19,9,56,30,64,64,91,4,76,70,78,39,43,91,81,72,26,44,42,76,46,45,61,28,7,6,58,72,36,80,42,55,90,0,48,61,5,91,51,43,72,55,44,37,0,1,90,9,6,81,29,0,81,40,30,18,25,54,25,88,16,86,43,49,8,79,1,77,45,92,25,32,66,48,67,48,73,57,78,95,9,77,89,10,52,76,42,56,58,79,45,18,9,51,42,86,14,37,38,30,18,74,29,77,82,35,64,15,28,47,64,25,53,80,84,14,90,6,74,67,57,79,83,37,99,10,5,85,43,78,94,72,2,26,16,14,63,73,11,56,31,38,37,48,94,51,26,95,66,77,66,91,58,43,56,17,89,79,56,3,75,51,74,49,4,59,62,39,42,26,37,29,69,24,7,2,9,32,6,38,92,0,47,92,39,76,17,12,10,92,93,4,93,96,54,83,87,90,65,26,32,47,33,59,85,16,41,5,58,49,18,43,28,94,16,31,86,42,72,63,70,35,13,61,52,81,7,57,1,53,69,52,47,4,50,2,46,94,47,32,87,63,71,86,71,36,29,52,68,50,28,99,37,85,82,76,49,83,40,22,58,18,12,28,48,70,23,54,33,15,71,38,32,39,60,91,56,94,53,84,98,50,16,97,4,15,25,22,75,93,3021
1,61,41,92,10,76,10,57,46,56,1,99,66,66,19,2,57,39,13,64,68,45,60,73,64,49,36,8,62,5,70,90,24,88,9,26,41,41,13,38,62,69,92,77,27,78,32,2,96,2,49,97,31,96,48,11,61,78,39,13,54,28,52,85,35,59,20,83,69,65,97,60,54,48,25,66,75,65,83,37,85,2,2,85,27,15,12,13,49,59,53,37,16,46,83,29,12,17,81,23,16,80,16,65,85,85,3,25,68,70,48,14,18,99,68,88,10,38,67,49,55,26,75,36,60,47,74,91,6,86,4,91,97,41,9,30,78,15,48,83,42,38,86,96,74,78,74,98,76,55,57,20,48,80,65,38,35,0,92,13,46,49,91,53,73,23,49,90,15,30,49,5,37,61,57,82,87,17,82,45,54,30,45,45,80,69,27,10,29,24,26,74,5,23,21,11,68,75,75,57,17,41,41,70,55,65,88,93,56,7,81,50,87,21,20,64,41,16,31,30,57,19,62,45,71,23,39,43,37,4,63,98,74,58,77,4,19,96,45,4,90,40,76,31,36,17,70,56,59,85,41,23,73,17,78,23,36,25,99,72,17,40,7,13,27,77,55,13,81,72,5,43,65,89,85,17,31,29,1,11,76,62,48,75,21,42,48,5,12,29,25,76,41,92,69,59,0,5,90,79,10,82,68,24,2,54,33,22,32,92,93,6,85,85,76,73,68,96,54,30,96,45,4,90,69,3,96,16,2,46,59,13,47,10,8,70,42,65,21,74,17,61,6,12,29,16,38,38,39,86,5,6,85,74,38,98,11,62,24,3,34,35,31,71,51,95,43,71,93,52,49,3,43,92,50,64,44,92,95,91,86,90,30,40,64,59,37,6,39,51,99,87,54,37,45,87,42,94,77,52,26,14,42,31,62,64,55,52,0,77,96,66,39,78,72,67,87,56,68,57,64,5,19,42,19,38,76,66,88,67,80,94,69,5,45,33,26,85,2,3,19,62,55,50,58,43,68,79,90,9,5,42,94,94,2,70,93,66,31,52,79,76,0,62,42,8,53,73,45,87,14,51,26,62,50,71,44,90,2,3,50,94,27,56,63,11,25,3,82,58,70,73,27,96,29,94,53,42,53,80,51,410
2,22,26,94,43,8,23,16,98,79,34,97,24,26,33,25,81,25,63,39,24,52,46,40,44,54,43,58,52,88,60,86,41,67,30,91,38,47,35,28,49,4,96,8,89,73,49,94,62,23,42,86,83,38,36,85,21,47,92,50,65,18,77,43,64,53,96,61,83,33,66,36,68,10,16,35,92,53,4,82,2,56,82,50,57,95,59,38,75,17,57,5,85,67,89,68,90,17,97,48,42,26,46,55,72,33,24,90,10,89,28,40,19,21,52,27,37,16,51,22,9,53,79,12,20,63,59,95,81,7,33,98,86,21,42,38,43,72,50,37,59,87,9,46,47,25,89,72,25,16,57,57,63,6,26,23,10,21,79,71,8,62,16,55,15,72,87,2,38,27,33,35,34,15,68,31,58,30,92,13,42,85,97,63,70,77,77,34,86,65,91,33,67,67,0,55,80,87,5,14,49,36,48,67,95,6,94,9,65,58,25,44,22,22,60,84,9,61,79,51,36,58,30,39,16,53,15,79,67,5,99,59,17,84,36,79,91,46,73,27,88,4,83,60,69,52,24,4,35,28,85,97,29,81,58,11,85,78,33,54,46,32,95,97,92,0,75,90,80,34,3,67,97,90,54,64,57,11,88,59,24,81,79,17,39,92,45,34,57,74,82,50,14,32,5,15,34,23,8,86,20,66,70,29,45,70,57,32,72,15,63,3,91,89,90,55,64,61,18,87,24,80,74,99,13,50,96,51,17,5,72,95,11,68,98,20,93,12,24,74,82,5,22,21,2,78,70,93,35,46,20,62,53,87,68,93,67,32,59,38,68,56,61,17,6,34,33,2,9,75,52,84,68,14,24,17,73,2,29,12,15,55,32,19,64,46,62,68,99,85,44,73,82,86,63,63,21,67,96,0,14,78,52,25,51,51,80,17,88,50,62,33,71,34,34,85,72,79,38,11,16,86,93,0,84,5,84,95,45,1,21,1,24,78,24,42,34,10,90,10,3,31,64,11,5,29,22,87,39,61,24,18,41,48,6,16,38,18,17,94,80,44,66,32,6,85,56,91,2,60,63,89,49,67,99,48,70,1,39,99,52,49,7,42,9,19,98,35,17,59,76,85,17,44,48,15,14,55,27,82,38,1118
3,26,71,94,94,97,11,69,13,61,99,69,78,28,36,68,71,32,82,63,75,91,56,8,67,65,66,33,35,35,71,57,76,73,66,18,15,32,46,64,73,47,44,5,8,97,88,49,69,12,62,33,23,69,77,57,38,53,2,41,32,56,78,40,27,99,50,59,82,74,55,63,2,67,22,7,67,51,12,22,97,79,29,54,46,59,62,79,19,40,90,59,33,39,92,45,28,3,87,39,21,41,39,28,67,63,48,64,58,62,59,70,84,45,95,4,89,44,97,94,4,32,14,25,48,72,91,56,4,39,0,56,76,26,45,86,78,2,46,51,0,94,76,43,40,16,70,67,32,77,78,25,4,88,47,18,57,84,51,31,22,37,50,54,62,76,21,76,42,7,9,75,0,75,33,16,73,15,64,34,75,33,18,64,95,41,39,68,98,76,99,48,8,71,76,54,10,73,19,97,60,34,47,9,4,71,2,46,52,1,24,18,67,91,20,72,75,91,52,52,8,39,39,71,65,97,45,5,10,24,19,71,67,36,55,51,59,27,59,50,33,43,9,33,40,83,4,84,52,27,18,65,26,55,4,67,26,19,1,83,95,85,18,97,84,22,19,20,34,79,99,71,78,39,27,91,67,28,61,23,58,92,49,81,60,21,51,40,32,58,68,76,22,40,75,30,14,62,33,21,33,93,65,56,6,41,35,65,38,49,83,91,60,29,18,71,75,55,13,50,22,47,38,67,21,96,42,78,30,33,59,52,42,63,42,99,28,66,51,93,65,32,7,11,24,17,52,98,25,75,1,58,44,30,70,77,50,91,46,6,63,66,94,37,65,87,96,15,68,38,32,3,65,21,29,43,46,81,97,90,59,47,27,2,48,24,37,23,26,33,21,7,98,85,21,29,7,14,23,6,68,73,92,55,61,9,99,86,93,88,37,64,80,26,52,67,21,8,74,76,11,86,1,87,4,80,44,13,28,49,25,46,54,13,99,51,22,87,46,9,46,48,6,57,78,44,35,31,31,32,67,63,56,40,23,98,77,42,76,15,9,98,75,94,63,58,60,71,9,67,97,31,59,97,46,64,54,22,30,76,52,73,40,8,1,33,61,89,49,66,90,65,32,20,21,99,29,82,70,4,17,6674
4,30,11,75,75,79,6,0,11,38,21,65,82,93,9,40,67,32,55,30,32,76,61,69,86,0,67,4,38,50,32,70,52,16,90,84,62,25,82,4,19,92,3,6,46,92,49,28,7,50,60,20,88,67,27,97,57,53,19,83,89,3,45,83,70,19,86,65,95,93,30,89,48,46,58,79,78,16,8,48,17,22,55,43,58,90,19,72,65,94,17,14,9,64,22,16,49,56,75,4,89,74,39,65,53,60,9,67,49,96,52,99,81,46,4,67,26,70,49,27,25,41,94,20,13,59,48,13,73,91,5,76,62,89,67,56,66,78,72,72,75,75,83,9,34,20,33,0,91,1,53,66,88,85,73,43,36,1,88,37,87,55,15,3,41,41,72,42,85,23,75,52,71,25,28,99,69,47,18,71,52,99,20,56,50,58,63,85,86,57,88,76,29,13,2,48,22,18,47,61,65,80,91,55,88,46,43,79,27,7,82,19,45,19,61,5,24,4,64,15,82,63,59,80,16,35,26,6,94,35,67,98,97,53,65,52,38,2,42,52,15,80,44,22,99,52,81,76,4,52,67,70,53,96,8,41,54,41,71,11,43,71,16,18,43,53,65,80,0,49,98,88,81,42,43,71,47,84,89,73,38,21,6,22,48,9,95,20,38,56,49,56,62,68,88,92,77,87,90,43,29,24,67,59,18,55,24,88,47,51,69,91,40,90,49,29,33,73,54,59,0,42,54,56,31,6,21,99,98,2,18,94,14,85,65,25,43,98,55,83,94,57,16,8,60,56,13,82,23,93,94,74,20,33,36,4,36,50,62,53,3,79,71,94,69,62,3,81,76,6,75,36,77,28,20,22,14,14,85,51,79,96,62,24,28,3,39,74,94,34,10,14,77,13,75,12,86,31,50,66,2,85,56,89,23,98,17,0,75,88,71,71,4,38,62,89,40,23,74,18,57,82,76,21,66,78,76,83,95,78,13,23,65,37,82,91,20,67,77,52,4,43,14,19,51,32,83,73,73,72,27,11,95,64,54,64,6,11,13,79,90,27,12,59,93,31,71,12,74,58,48,36,32,0,46,48,89,91,15,95,90,17,29,96,5,91,66,85,30,14,14,43,39,34,13,16,44,67,54,8,27,825
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,
...,...
290085,50,61,95,79,76,46,81,48,49,97,5,66,32,93,17,94,34,67,13,55,10,20,56,39,31,67,57,81,46,90,84,61,98,61,8,82,0,47,52,17,70,59,99,98,23,67,9,64,38,50,92,32,17,41,33,12,90,35,20,42,34,47,23,22,96,20,10,64,17,93,59,12,49,19,17,19,59,43,7,72,87,37,7,37,62,4,52,42,87,5,39,92,83,94,62,86,47,44,12,21,5,82,31,13,79,95,17,47,49,59,23,72,34,77,24,37,65,89,15,2,89,21,89,82,20,53,20,73,19,97,91,17,34,26,56,27,24,50,69,17,71,45,34,56,17,29,44,65,16,28,62,53,46,88,10,20,31,91,7,28,10,59,47,10,57,31,0,75,91,84,32,43,36,53,31,38,28,56,77,15,79,88,91,20,89,83,9,40,55,90,73,36,78,76,43,93,49,77,76,17,66,72,32,25,26,65,46,62,95,85,62,69,53,7,5,29,30,71,22,95,79,84,12,70,22,12,56,68,45,53,36,85,36,38,67,73,55,18,75,84,63,52,44,46,51,15,65,80,85,19,2,61,9,1,88,78,27,69,37,28,92,38,79,9,1,32,77,65,71,74,59,53,18,25,65,63,7,27,49,65,81,88,49,23,5,16,69,52,83,58,65,22,42,95,64,73,29,7,90,35,38,76,32,46,15,96,8,10,63,65,20,83,47,60,51,46,46,45,33,77,43,54,18,43,85,26,33,80,0,85,15,34,64,11,96,90,15,65,77,83,61,78,60,92,51,98,12,37,32,11,31,96,79,0,37,35,5,34,4,26,14,16,98,94,39,42,61,54,13,10,48,41,75,10,6,10,93,27,71,78,60,1,77,74,36,86,37,58,20,62,23,41,84,10,24,0,88,82,33,3,34,99,90,65,31,15,8,62,19,39,60,42,38,89,70,0,87,60,74,29,7,78,73,14,71,77,90,49,7,90,1,50,19,36,80,60,1,58,77,27,60,15,79,53,0,30,60,99,96,28,37,36,35,27,59,2,59,70,93,90,71,66,58,33,12,52,75,41,18,71,98,99,6,51,31,83,8,16,10,15,38,29,16,86,49,55,94,33,79,70,43,83,70,87,99,6,19,30,80,19,4819
290086,88,90,73,44,17,2,73,22,99,95,64,81,67,19,11,8,49,10,44,72,70,74,1,78,40,98,26,55,78,68,69,78,39,3,40,56,22,77,85,85,63,34,72,55,27,24,45,72,66,83,57,22,5,78,2,33,93,84,0,62,20,32,89,40,71,61,49,17,89,57,95,17,32,25,99,4,28,26,84,37,69,38,13,80,13,12,89,86,17,29,46,58,87,2,32,16,66,85,36,13,26,21,83,98,17,17,45,45,77,42,22,5,80,74,73,78,16,66,26,49,22,26,30,47,78,21,78,36,23,12,57,42,74,29,9,55,19,60,93,17,44,89,23,41,47,66,16,56,81,20,70,57,90,62,41,15,89,27,25,68,83,78,61,46,55,40,51,52,27,11,20,93,0,54,42,73,28,95,19,58,68,11,10,17,69,44,97,83,21,64,67,49,4,70,21,64,6,13,94,27,90,56,60,37,75,95,62,82,85,99,25,68,66,1,10,44,59,12,9,86,99,9,12,41,93,53,39,31,87,62,71,61,0,89,77,84,71,42,34,92,75,23,9,80,4,93,9,59,83,68,20,41,10,72,78,78,37,52,9,26,35,87,77,81,99,15,99,44,17,88,17,39,63,3,49,0,48,91,37,6,30,11,29,1,33,32,32,0,77,82,94,63,20,94,70,42,34,14,89,94,85,93,95,51,15,41,21,6,71,60,68,61,8,24,60,67,90,19,47,27,48,75,11,72,23,21,24,69,77,42,40,91,58,28,9,85,32,44,31,97,12,15,37,8,73,87,21,56,8,93,37,27,79,82,12,36,29,75,25,38,18,10,87,54,52,59,61,8,64,96,50,27,53,49,66,21,9,7,8,65,61,65,18,35,66,18,34,65,34,94,17,45,89,88,1,20,33,10,27,1,4,29,63,51,43,7,41,81,19,14,36,24,93,66,33,75,26,91,77,72,17,70,90,89,75,18,27,48,2,40,89,85,34,65,88,3,10,96,57,48,90,91,42,3,22,93,47,50,95,89,63,41,32,20,98,96,32,93,99,98,44,74,50,42,27,98,1,43,6,31,65,1,8,14,97,26,0,47,77,58,81,19,59,53,38,94,39,65,23,9,38,50,88,97,28,64,90,66,90,6,3960
290087,23,73,80,4,60,18,64,14,40,58,11,10,1,70,18,46,73,10,38,71,62,33,55,50,94,58,96,39,77,59,58,22,96,41,68,96,29,53,94,5,91,31,4,94,41,97,92,2,83,65,31,29,96,54,95,27,66,54,64,89,38,6,63,88,11,40,56,59,25,48,13,36,12,5,35,32,42,21,70,12,77,11,10,54,50,22,84,85,17,60,20,39,55,94,8,89,55,32,69,72,88,58,21,19,23,38,45,78,23,79,82,67,64,90,60,14,47,98,19,50,47,47,89,4,0,49,57,89,54,50,65,69,87,98,88,30,64,86,90,40,59,64,47,15,50,2,82,46,90,3,20,50,84,75,56,50,86,30,32,22,6,6,96,72,22,16,36,46,20,20,44,21,73,16,65,91,8,45,89,91,78,70,30,59,6,58,91,56,14,54,57,89,6,57,48,63,5,63,24,14,40,65,97,54,90,75,34,21,44,79,52,13,45,32,62,52,77,85,64,21,90,64,67,9,75,20,73,55,74,54,70,5,43,86,35,8,87,88,34,97,75,71,41,17,86,14,9,81,36,64,43,92,80,96,44,65,34,25,25,15,78,77,68,81,63,18,19,68,17,49,5,94,1,6,56,28,79,55,16,39,87,55,56,95,93,11,98,64,76,46,89,49,68,97,28,70,63,75,47,62,64,96,22,84,82,28,34,53,75,15,50,1,50,83,55,91,35,76,7,1,56,50,28,83,36,91,88,99,29,41,43,7,11,42,81,43,48,21,3,84,63,66,94,19,41,97,66,20,43,3,59,42,21,52,73,0,80,33,12,32,81,46,71,13,36,48,56,4,42,75,43,62,0,75,9,89,87,96,44,13,76,30,91,16,60,68,56,41,36,29,77,20,82,62,68,89,53,44,55,8,74,0,45,21,7,38,2,81,10,80,71,23,59,62,30,40,43,63,81,63,91,45,69,44,20,77,78,6,7,16,44,52,86,57,9,34,96,75,67,88,49,93,70,6,12,62,7,43,51,75,74,27,27,51,6,40,31,58,61,95,0,15,32,68,35,58,35,95,37,84,16,56,77,63,68,53,10,55,65,54,37,34,25,75,95,39,22,14,65,90,65,19,49,50,36,92,9,6,45,64,292
290088,25,6,75,74,26,56,32,33,57,44,49,23,46,70,91,36,93,52,22,27,16,55,31,92,68,49,67,94,86,27,5,98,99,50,7,59,88,80,70,72,25,61,70,22,19,97,65,92,12,0,27,47,81,86,58,33,56,64,46,73,86,59,61,50,75,30,52,49,93,13,60,89,47,29,24,81,8,36,20,35,24,25,74,50,71,13,58,17,63,19,86,83,5,64,52,87,12,86,19,6,88,93,87,52,93,43,46,83,97,65,64,5,52,0,54,31,36,77,92,42,32,24,59,20,68,35,67,90,98,30,73,71,15,90,43,30,1,41,68,39,5,36,88,32,20,99,59,77,16,69,26,12,47,24,99,79,81,51,10,65,82,83,23,52,86,74,88,25,54,77,93,19,30,25,54,40,56,16,86,8,43,3,93,43,54,22,40,75,89,1,58,41,35,55,43,88,19,79,57,29,18,76,27,49,85,94,8,8,17,84,31,27,11,27,58,5,74,1,94,71,23,74,89,19,18,40,98,38,36,47,6,52,3,67,81,33,33,37,19,93,1,39,88,77,35,4,37,2,49,49,47,84,75,76,91,80,50,82,8,53,3,56,45,0,93,5,47,39,70,20,30,25,3,93,54,40,55,92,64,74,76,73,96,23,41,17,23,77,20,28,54,4,63,54,92,24,63,19,15,55,0,7,93,71,43,20,2,69,18,93,22,82,15,77,96,11,24,85,12,91,92,47,67,18,87,21,55,44,81,92,73,8,10,92,48,47,11,28,93,18,29,61,89,47,86,56,82,76,67,40,89,56,10,76,95,22,33,83,42,36,49,63,12,44,67,55,4,11,36,37,10,21,41,3,56,28,8,21,54,55,54,28,8,33,36,62,77,42,34,12,93,27,82,26,78,38,47,14,40,84,88,27,62,84,67,36,83,75,61,79,24,3,3,52,87,24,21,85,45,6,63,82,15,37,35,76,35,96,77,59,28,74,35,31,78,32,96,69,43,62,53,97,54,74,2,15,32,32,3,15,97,89,82,41,57,28,62,51,4,91,74,50,67,36,11,43,84,99,6,20,28,14,59,84,48,26,35,1,25,52,7,50,45,70,16,67,38,45,27,29,78,13,48,67,98,72,10,16,22,30,444


In [17]:
%%time
pd_df[pd_df.col2>70]

# summary : pandas slower in filtering

Wall time: 10.2 s


Unnamed: 0,col0,col1,col2,col3,col4,col5,col6,col7,col8,col9,...,col491,col492,col493,col494,col495,col496,col497,col498,col499,multiplication_col13
0,98,10,87,81,97,91,31,70,42,30,...,10,88,16,66,41,12,50,49,15,810
2,29,57,98,15,60,80,71,89,63,26,...,61,32,91,62,27,43,14,59,80,855
3,18,62,81,94,11,35,54,97,0,27,...,25,50,21,94,32,86,24,8,11,5828
7,80,11,93,25,98,42,5,83,12,12,...,19,45,46,23,97,40,99,81,14,275
10,18,59,76,36,12,89,31,92,81,28,...,47,28,51,97,25,78,16,12,83,2124
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
999987,22,40,71,90,47,9,9,35,92,25,...,23,48,11,95,9,27,73,89,46,3600
999993,26,35,90,28,97,87,89,29,15,10,...,30,11,67,78,7,43,40,77,12,980
999996,69,32,97,50,18,9,90,53,60,19,...,57,81,62,12,10,61,58,84,46,1600
999997,88,75,78,99,30,60,94,44,13,56,...,3,95,95,48,12,9,40,20,7,7425


In [18]:
# Filtering here does not make a memory copy.
dff = vaex_df[vaex_df["col2"] > 70]

In [19]:
# All the algorithms work out of core; the limit is the size of your hard drive.
# Minimum and maximum of col2 over the filtered rows, with a widget progress bar.
dff["col2"].minmax(progress='widget')

HBox(children=(FloatProgress(value=0.0, max=1.0), Label(value='In progress...')))

array([71, 99], dtype=int64)

### Fast groupby / aggregations
Vaex implements parallelized, high-performance groupby operations, especially when using categories (more than 1 billion rows per second).

In [20]:
%%time
vaex_df_group=vaex_df.groupby(vaex_df.col1,agg=vaex.agg.mean(vaex_df.col4))
vaex_df_group

Wall time: 78.6 ms


#,col1,col4_mean
0,6,49.369004413928394
1,24,49.74346912220999
2,78,49.37421352242085
3,54,49.90093402225755
4,57,49.70840932117528
...,...,...
95,94,49.425266362252664
96,83,49.53386454183267
97,82,49.7075
98,88,49.29712932820361


In [21]:
%%time
vaex_df.groupby(vaex_df.col1,agg='count')

Wall time: 26 ms


#,col1,count
0,6,10195
1,24,9991
2,78,10013
3,54,10064
4,57,9870
...,...,...
95,94,9855
96,83,9789
97,82,10000
98,88,10137
