In [1]:
import pandas as pd
import numpy as np

In [2]:
# Read the three raw CSV tables from the working directory:
# the train/test bidder tables and the bid log.
df_train, df_test, df_bids = (
    pd.read_csv(csv_name) for csv_name in ('train.csv', 'test.csv', 'bids.csv')
)

In [3]:
# Remove pandas' display truncation for both columns and rows.
# Caution: with max_rows unset, displaying a large frame without .head()
# will render every row.
for display_option in ('display.max_columns', 'display.max_rows'):
    pd.set_option(display_option, None)

## Explore Data

In [4]:
# Summarise the training bidder table: index range, per-column dtype and
# non-null count, and memory usage. max_cols=200 raises the column limit
# above which pandas would switch to a truncated summary.
df_train.info(max_cols=200)

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 2013 entries, 0 to 2012
Data columns (total 4 columns):
bidder_id          2013 non-null object
payment_account    2013 non-null object
address            2013 non-null object
outcome            2013 non-null float64
dtypes: float64(1), object(3)
memory usage: 63.0+ KB


In [5]:
# Summarise the bid log: index range, per-column dtype and memory usage.
# max_cols=200 raises the column limit above which pandas would switch to
# a truncated summary.
df_bids.info(max_cols=200)

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 7656334 entries, 0 to 7656333
Data columns (total 9 columns):
bid_id         int64
bidder_id      object
auction        object
merchandise    object
device         object
time           int64
country        object
ip             object
url            object
dtypes: int64(2), object(7)
memory usage: 525.7+ MB


In [6]:
# Summarise the test bidder table: index range, per-column dtype and
# non-null count, and memory usage. max_cols=200 raises the column limit
# above which pandas would switch to a truncated summary.
df_test.info(max_cols=200)

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 4700 entries, 0 to 4699
Data columns (total 3 columns):
bidder_id          4700 non-null object
payment_account    4700 non-null object
address            4700 non-null object
dtypes: object(3)
memory usage: 110.2+ KB


In [7]:
# Preview the first three rows of the training bidder table.
df_train.head(3)

Unnamed: 0,bidder_id,payment_account,address,outcome
0,91a3c57b13234af24875c56fb7e2b2f4rb56a,a3d2de7675556553a5f08e4c88d2c228754av,a3d2de7675556553a5f08e4c88d2c228vt0u4,0.0
1,624f258b49e77713fc34034560f93fb3hu3jo,a3d2de7675556553a5f08e4c88d2c228v1sga,ae87054e5a97a8f840a3991d12611fdcrfbq3,0.0
2,1c5f4fc669099bfbfac515cd26997bd12ruaj,a3d2de7675556553a5f08e4c88d2c2280cybl,92520288b50f03907041887884ba49c0cl0pd,0.0


In [8]:
# Preview the first three rows of the bid log.
df_bids.head(3)

Unnamed: 0,bid_id,bidder_id,auction,merchandise,device,time,country,ip,url
0,0,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,ewmzr,jewelry,phone0,9759243157894736,us,69.166.231.58,vasstdc27m7nks3
1,1,668d393e858e8126275433046bbd35c6tywop,aeqok,furniture,phone1,9759243157894736,in,50.201.125.84,jmqlhflrzwuay9c
2,2,aa5f360084278b35d746fa6af3a7a1a5ra3xe,wa00e,home goods,phone2,9759243157894736,py,112.54.208.157,vasstdc27m7nks3


In [9]:
# Preview the first three rows of the test bidder table.
df_test.head(3)

Unnamed: 0,bidder_id,payment_account,address
0,49bb5a3c944b8fc337981cc7a9ccae41u31d7,a3d2de7675556553a5f08e4c88d2c228htx90,5d9fa1b71f992e7c7a106ce4b07a0a754le7c
1,a921612b85a1494456e74c09393ccb65ylp4y,a3d2de7675556553a5f08e4c88d2c228rs17i,a3d2de7675556553a5f08e4c88d2c228klidn
2,6b601e72a4d264dab9ace9d7b229b47479v6i,925381cce086b8cc9594eee1c77edf665zjpl,a3d2de7675556553a5f08e4c88d2c228aght0


In [10]:
# Print the number of distinct values in each column of the bid log
# (a missing value, if present, counts as one distinct value).
for col_name in df_bids.columns:
    distinct_count = df_bids[col_name].nunique(dropna=False)
    print(col_name + ': {}'.format(distinct_count))

bid_id: 7656334
bidder_id: 6614
auction: 15051
merchandise: 10
device: 7351
time: 776529
country: 200
ip: 2303991
url: 1786351


In [11]:
# Print the number of distinct values in each column of the training
# bidder table (a missing value, if present, counts as one distinct value).
for col_name in df_train.columns:
    distinct_count = df_train[col_name].nunique(dropna=False)
    print(col_name + ': {}'.format(distinct_count))

bidder_id: 2013
payment_account: 2013
address: 2013
outcome: 2


In [12]:
# Print the number of distinct values in each column of the test bidder
# table (a missing value, if present, counts as one distinct value).
for col_name in df_test.columns:
    distinct_count = df_test[col_name].nunique(dropna=False)
    print(col_name + ': {}'.format(distinct_count))

bidder_id: 4700
payment_account: 4700
address: 4700


## Join tables to create the dataset

In [13]:
# Attach bidder attributes to every bid row, matching on bidder_id.
# The inner join keeps only bids whose bidder_id appears in the respective
# bidder table; bidders that have no rows in df_bids do not appear in the result.
df_joined_train = df_bids.merge(df_train, how='inner', on='bidder_id')
df_joined_test = df_bids.merge(df_test, how='inner', on='bidder_id')

## Explore the joined data

In [14]:
# Summarise the joined training table: index range, per-column dtype and
# memory usage. max_cols=200 raises the column limit above which pandas
# would switch to a truncated summary.
df_joined_train.info(max_cols=200)

<class 'pandas.core.frame.DataFrame'>
Int64Index: 3071224 entries, 0 to 3071223
Data columns (total 12 columns):
bid_id             int64
bidder_id          object
auction            object
merchandise        object
device             object
time               int64
country            object
ip                 object
url                object
payment_account    object
address            object
outcome            float64
dtypes: float64(1), int64(2), object(9)
memory usage: 304.6+ MB


In [15]:
# Summarise the joined test table: index range, per-column dtype and
# memory usage. max_cols=200 raises the column limit above which pandas
# would switch to a truncated summary.
df_joined_test.info(max_cols=200)

<class 'pandas.core.frame.DataFrame'>
Int64Index: 4585110 entries, 0 to 4585109
Data columns (total 11 columns):
bid_id             int64
bidder_id          object
auction            object
merchandise        object
device             object
time               int64
country            object
ip                 object
url                object
payment_account    object
address            object
dtypes: int64(2), object(9)
memory usage: 419.8+ MB


In [16]:
# Preview the first three rows of the joined training table.
df_joined_train.head(3)

Unnamed: 0,bid_id,bidder_id,auction,merchandise,device,time,country,ip,url,payment_account,address,outcome
0,1,668d393e858e8126275433046bbd35c6tywop,aeqok,furniture,phone1,9759243157894736,in,50.201.125.84,jmqlhflrzwuay9c,a3d2de7675556553a5f08e4c88d2c228ucoac,42a3b61a1fe69d66ad60f3e347aa09b1erfe2,0.0
1,25,668d393e858e8126275433046bbd35c6tywop,38v0a,furniture,phone4,9759243315789473,bd,147.64.206.30,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c228ucoac,42a3b61a1fe69d66ad60f3e347aa09b1erfe2,0.0
2,39,668d393e858e8126275433046bbd35c6tywop,aeqok,furniture,phone35,9759243368421052,in,75.11.239.20,i92xwb95qdo901j,a3d2de7675556553a5f08e4c88d2c228ucoac,42a3b61a1fe69d66ad60f3e347aa09b1erfe2,0.0


In [17]:
# Preview the first three rows of the joined test table.
df_joined_test.head(3)

Unnamed: 0,bid_id,bidder_id,auction,merchandise,device,time,country,ip,url,payment_account,address
0,0,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,ewmzr,jewelry,phone0,9759243157894736,us,69.166.231.58,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25
1,14,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,wberf,jewelry,phone15,9759243263157894,au,134.243.148.253,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25
2,106,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,hw5at,jewelry,phone80,9759243736842105,ke,227.231.81.211,v2gyrh0dbr31atn,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25


#### The label column is `outcome`

In [None]:
# Print the number of distinct values in each column of the joined test
# table (a missing value, if present, counts as one distinct value).
for col_name in df_joined_test.columns:
    distinct_count = df_joined_test[col_name].nunique(dropna=False)
    print(col_name + ': {}'.format(distinct_count))

## Slice the joined DataFrame by auction (`auction` column)

In [219]:
def slice_by_auction(df_joined, verbose=True):
    """Split a joined bids table into one DataFrame per auction.

    Parameters
    ----------
    df_joined : pandas.DataFrame
        Table containing an ``auction`` column, e.g. ``df_joined_test`` or
        ``df_joined_train``.
    verbose : bool, default True
        When true, print the auction id and the shape of its slice for every
        auction. Pass ``False`` to avoid thousands of output lines.

    Returns
    -------
    dict
        Maps each auction id to the rows of ``df_joined`` belonging to that
        auction. Keys are in order of first appearance and rows keep their
        original index and order. Rows whose ``auction`` value is missing are
        not included.
    """
    slices = {}
    # A single groupby pass replaces one full boolean-mask scan of the frame
    # per auction id. sort=False keeps keys in first-appearance order, the
    # same order that .unique() yields.
    for auction_id, auction_rows in df_joined.groupby('auction', sort=False):
        slices[auction_id] = auction_rows
        if verbose:
            print('id: {}, df_shape: {}'.format(auction_id, auction_rows.shape))
    return slices


# The helper works for either split; call it with df_joined_train to slice
# the training data the same way.
auctions = df_joined_test['auction'].unique()
# NOTE: the misspelled name `auction_dictinoary` is kept on purpose so that any
# other cell referring to it keeps working.
auction_dictinoary = slice_by_auction(df_joined_test)

id: ewmzr, df_shape: (2068, 11)
id: wberf, df_shape: (4, 11)
id: hw5at, df_shape: (279, 11)
id: uw3sx, df_shape: (1410, 11)
id: q79ya, df_shape: (548, 11)
id: qcppg, df_shape: (2051, 11)
id: fqfbw, df_shape: (305, 11)
id: idfc3, df_shape: (942, 11)
id: 2yowp, df_shape: (2893, 11)
id: tp9bl, df_shape: (469, 11)
id: 3boba, df_shape: (3120, 11)
id: csvpq, df_shape: (46, 11)
id: fe96d, df_shape: (193, 11)
id: lfz7h, df_shape: (1561, 11)
id: 20fsz, df_shape: (906, 11)
id: tep1m, df_shape: (16508, 11)
id: fn6fr, df_shape: (1197, 11)
id: zfls2, df_shape: (578, 11)
id: skwyv, df_shape: (574, 11)
id: bggqz, df_shape: (732, 11)
id: wghzu, df_shape: (1279, 11)
id: xk5nb, df_shape: (422, 11)
id: 48olb, df_shape: (749, 11)
id: 77vfr, df_shape: (458, 11)
id: qtmwx, df_shape: (708, 11)
id: bstmq, df_shape: (2293, 11)
id: dt5o5, df_shape: (1044, 11)
id: n9b6x, df_shape: (674, 11)
id: f655d, df_shape: (244, 11)
id: 2uu2n, df_shape: (11767, 11)
id: g26sr, df_shape: (1707, 11)
id: 5m2x6, df_shape: (737, 

id: hcyv4, df_shape: (6, 11)
id: 34x8e, df_shape: (532, 11)
id: 8irza, df_shape: (516, 11)
id: ot9h5, df_shape: (31, 11)
id: zg1vo, df_shape: (12, 11)
id: dep5u, df_shape: (222, 11)
id: 7jwgb, df_shape: (3, 11)
id: vz8q9, df_shape: (421, 11)
id: j6xul, df_shape: (470, 11)
id: 9daf9, df_shape: (34, 11)
id: 5w73e, df_shape: (265, 11)
id: 408np, df_shape: (23, 11)
id: m6jxa, df_shape: (13, 11)
id: 62t0a, df_shape: (345, 11)
id: byib8, df_shape: (418, 11)
id: vvb6h, df_shape: (518, 11)
id: pfa9f, df_shape: (47, 11)
id: udb7l, df_shape: (402, 11)
id: 9waah, df_shape: (1591, 11)
id: bx2l4, df_shape: (32, 11)
id: 9z1le, df_shape: (16, 11)
id: pgymx, df_shape: (26, 11)
id: bgvgc, df_shape: (1686, 11)
id: 3zuwz, df_shape: (1556, 11)
id: qrfc2, df_shape: (323, 11)
id: nhc1n, df_shape: (3, 11)
id: xl5xn, df_shape: (90, 11)
id: wscxj, df_shape: (56, 11)
id: k6snz, df_shape: (285, 11)
id: kmpo5, df_shape: (44, 11)
id: drs2x, df_shape: (1168, 11)
id: w7htt, df_shape: (447, 11)
id: k5e3t, df_shape: (

id: ef0ef, df_shape: (27, 11)
id: ln020, df_shape: (816, 11)
id: 6144k, df_shape: (17, 11)
id: 4600j, df_shape: (24, 11)
id: qcro8, df_shape: (31, 11)
id: hxcvo, df_shape: (4, 11)
id: ou8dk, df_shape: (22, 11)
id: lcb6r, df_shape: (890, 11)
id: mb4la, df_shape: (80, 11)
id: hz7fz, df_shape: (9, 11)
id: mm43x, df_shape: (27, 11)
id: psk8p, df_shape: (4, 11)
id: ixoqw, df_shape: (420, 11)
id: xyncu, df_shape: (8, 11)
id: vzsaw, df_shape: (8, 11)
id: ijzo9, df_shape: (14, 11)
id: sxko0, df_shape: (1740, 11)
id: dywc2, df_shape: (128, 11)
id: ml31n, df_shape: (322, 11)
id: 9ucqf, df_shape: (9, 11)
id: qgx89, df_shape: (36, 11)
id: o0mdj, df_shape: (4, 11)
id: krztg, df_shape: (13, 11)
id: hdkcs, df_shape: (32, 11)
id: mjkhv, df_shape: (29, 11)
id: ujwe0, df_shape: (12, 11)
id: 5vwna, df_shape: (3, 11)
id: zo1p3, df_shape: (1051, 11)
id: bvxbf, df_shape: (33, 11)
id: bmm5t, df_shape: (40, 11)
id: 37l5c, df_shape: (24, 11)
id: lif9a, df_shape: (12, 11)
id: pldnu, df_shape: (16, 11)
id: rfpsc

id: lxmyo, df_shape: (2, 11)
id: bg5dh, df_shape: (18, 11)
id: zcosl, df_shape: (30, 11)
id: 8w0e8, df_shape: (128, 11)
id: y6235, df_shape: (9, 11)
id: av0w3, df_shape: (96, 11)
id: rqibp, df_shape: (17, 11)
id: iw8xl, df_shape: (1410, 11)
id: kjjnr, df_shape: (35, 11)
id: jg1c1, df_shape: (17, 11)
id: rkeam, df_shape: (13, 11)
id: zp0wr, df_shape: (2, 11)
id: q4uv7, df_shape: (64, 11)
id: v27wi, df_shape: (10, 11)
id: wa00e, df_shape: (97, 11)
id: 88xe3, df_shape: (351, 11)
id: ne9lq, df_shape: (117, 11)
id: ht9lw, df_shape: (66, 11)
id: d1um1, df_shape: (766, 11)
id: 78i4o, df_shape: (20, 11)
id: giyj4, df_shape: (990, 11)
id: 5pye9, df_shape: (396, 11)
id: gi05a, df_shape: (17968, 11)
id: 9xost, df_shape: (166, 11)
id: blkjh, df_shape: (6194, 11)
id: 5aaba, df_shape: (40, 11)
id: xin2t, df_shape: (28, 11)
id: pyy8k, df_shape: (774, 11)
id: 8ywoe, df_shape: (60, 11)
id: dowem, df_shape: (4, 11)
id: otczn, df_shape: (847, 11)
id: iq5be, df_shape: (2652, 11)
id: fkfln, df_shape: (41, 

id: cu9dk, df_shape: (237, 11)
id: u5dg6, df_shape: (132, 11)
id: nw777, df_shape: (190, 11)
id: qb9ad, df_shape: (139, 11)
id: ye64c, df_shape: (194, 11)
id: fwg6z, df_shape: (212, 11)
id: cjzh6, df_shape: (272, 11)
id: h0c8o, df_shape: (191, 11)
id: xig5x, df_shape: (210, 11)
id: 10zfj, df_shape: (529, 11)
id: thyqa, df_shape: (87, 11)
id: 85k6u, df_shape: (61, 11)
id: jmxhr, df_shape: (65, 11)
id: o3yt3, df_shape: (66, 11)
id: tw5gw, df_shape: (61, 11)
id: pyq31, df_shape: (115, 11)
id: 15qdl, df_shape: (35, 11)
id: 8disy, df_shape: (14, 11)
id: pg37c, df_shape: (214, 11)
id: 13gi4, df_shape: (47, 11)
id: 95yqc, df_shape: (6, 11)
id: q18qg, df_shape: (27, 11)
id: rqn9c, df_shape: (17, 11)
id: jklnk, df_shape: (121, 11)
id: 8qtjg, df_shape: (342, 11)
id: acbql, df_shape: (22, 11)
id: enigu, df_shape: (31, 11)
id: htiyi, df_shape: (128, 11)
id: 2y6y2, df_shape: (14, 11)
id: p142v, df_shape: (79, 11)
id: ay5c0, df_shape: (54, 11)
id: kpr78, df_shape: (116, 11)
id: zlt1w, df_shape: (23,

id: 1sgd8, df_shape: (321, 11)
id: krvi4, df_shape: (96, 11)
id: atsc4, df_shape: (58, 11)
id: 14ijz, df_shape: (211, 11)
id: 74lts, df_shape: (9, 11)
id: k1g7r, df_shape: (5377, 11)
id: 38v0a, df_shape: (4445, 11)
id: aeqok, df_shape: (5427, 11)
id: uo3lj, df_shape: (4198, 11)
id: h2xrf, df_shape: (6331, 11)
id: 1rc8d, df_shape: (4140, 11)
id: 4xjfh, df_shape: (90, 11)
id: 55y7n, df_shape: (4311, 11)
id: mrscj, df_shape: (542, 11)
id: 7msk4, df_shape: (4805, 11)
id: jkyzt, df_shape: (5125, 11)
id: 7etdx, df_shape: (6141, 11)
id: 2jqhl, df_shape: (1774, 11)
id: tcaab, df_shape: (8495, 11)
id: n6qxu, df_shape: (59, 11)
id: 4r2xe, df_shape: (101, 11)
id: qlqfz, df_shape: (385, 11)
id: 8l2m3, df_shape: (165, 11)
id: mpjse, df_shape: (520, 11)
id: o7jit, df_shape: (48, 11)
id: rcbeq, df_shape: (180, 11)
id: dm7xj, df_shape: (2297, 11)
id: zp95y, df_shape: (2, 11)
id: 2i2p9, df_shape: (57, 11)
id: 5o8mg, df_shape: (3, 11)
id: z8f76, df_shape: (5, 11)
id: syc9b, df_shape: (247, 11)
id: z2hw8

id: wicy8, df_shape: (393, 11)
id: bi9cv, df_shape: (1, 11)
id: tz03g, df_shape: (2, 11)
id: 6v22z, df_shape: (6, 11)
id: 0pvd4, df_shape: (10, 11)
id: c341p, df_shape: (38, 11)
id: 71xv5, df_shape: (33, 11)
id: usqk4, df_shape: (25, 11)
id: gzc9j, df_shape: (124, 11)
id: 8v721, df_shape: (76, 11)
id: iw81c, df_shape: (78, 11)
id: 16gks, df_shape: (110, 11)
id: vk3vz, df_shape: (50, 11)
id: zz4dz, df_shape: (100, 11)
id: skn87, df_shape: (14, 11)
id: alcb1, df_shape: (65, 11)
id: i9yuh, df_shape: (10, 11)
id: u0m8k, df_shape: (31, 11)
id: 9l6ps, df_shape: (1119, 11)
id: vosi7, df_shape: (3, 11)
id: cqb50, df_shape: (117, 11)
id: d6dyo, df_shape: (21, 11)
id: 5bi3y, df_shape: (540, 11)
id: 03n0o, df_shape: (21, 11)
id: uvo6j, df_shape: (182, 11)
id: lxkrp, df_shape: (13, 11)
id: u74qi, df_shape: (347, 11)
id: eg7i4, df_shape: (156, 11)
id: vrsb8, df_shape: (73, 11)
id: jpxg4, df_shape: (397, 11)
id: xs0cg, df_shape: (444, 11)
id: 54pf4, df_shape: (57, 11)
id: vi4bm, df_shape: (126, 11)


id: ne5be, df_shape: (1, 11)
id: asvbw, df_shape: (7, 11)
id: jr9vt, df_shape: (1, 11)
id: 6q1an, df_shape: (3, 11)
id: 1fd8w, df_shape: (2, 11)
id: 9e6f5, df_shape: (39, 11)
id: 4h2ob, df_shape: (38, 11)
id: umlyz, df_shape: (30, 11)
id: p7vfq, df_shape: (2, 11)
id: gms0v, df_shape: (106, 11)
id: lnq5p, df_shape: (6, 11)
id: j9pj0, df_shape: (1, 11)
id: w5puq, df_shape: (4, 11)
id: 42nps, df_shape: (6, 11)
id: rxzqi, df_shape: (25, 11)
id: coy1i, df_shape: (2, 11)
id: jbymh, df_shape: (24, 11)
id: g3eqb, df_shape: (12, 11)
id: qpslu, df_shape: (182, 11)
id: 5zw7j, df_shape: (12, 11)
id: cun3u, df_shape: (8, 11)
id: 6a4zq, df_shape: (54, 11)
id: uwhzs, df_shape: (1, 11)
id: q2upd, df_shape: (7, 11)
id: v2sfx, df_shape: (75, 11)
id: 8je1p, df_shape: (2, 11)
id: 25b5r, df_shape: (30, 11)
id: 5ovmg, df_shape: (22, 11)
id: 2l7wt, df_shape: (8, 11)
id: sp3ds, df_shape: (1, 11)
id: mwjzk, df_shape: (16, 11)
id: zdsnl, df_shape: (11, 11)
id: slnsu, df_shape: (8, 11)
id: fchwb, df_shape: (18, 

id: 6fzbm, df_shape: (771, 11)
id: tujb3, df_shape: (6, 11)
id: i9qc6, df_shape: (6, 11)
id: ch4uu, df_shape: (1, 11)
id: j9bji, df_shape: (32, 11)
id: xgzyu, df_shape: (4, 11)
id: f4srh, df_shape: (5, 11)
id: vnipz, df_shape: (10, 11)
id: dhy31, df_shape: (3, 11)
id: ym2x2, df_shape: (2, 11)
id: sh9ar, df_shape: (7, 11)
id: lh72r, df_shape: (17, 11)
id: ipscb, df_shape: (8, 11)
id: cmkc2, df_shape: (10, 11)
id: xbcyd, df_shape: (78, 11)
id: r9g6m, df_shape: (1, 11)
id: 0hyxf, df_shape: (3, 11)
id: roxhl, df_shape: (3, 11)
id: pekpv, df_shape: (4, 11)
id: a3j5i, df_shape: (16, 11)
id: hx8ea, df_shape: (3, 11)
id: fzie5, df_shape: (4, 11)
id: uz4dl, df_shape: (458, 11)
id: rn2h8, df_shape: (23, 11)
id: f7al4, df_shape: (2, 11)
id: 9y63m, df_shape: (5, 11)
id: jm80p, df_shape: (56, 11)
id: m542h, df_shape: (1, 11)
id: wdkmw, df_shape: (7, 11)
id: iq4pq, df_shape: (239, 11)
id: 1ri0k, df_shape: (1, 11)
id: 5txbk, df_shape: (4, 11)
id: 8iy1a, df_shape: (4, 11)
id: unr3r, df_shape: (2, 11)


id: tj4f7, df_shape: (10, 11)
id: 49nqa, df_shape: (24, 11)
id: i2x23, df_shape: (11, 11)
id: 8505w, df_shape: (11, 11)
id: hafvx, df_shape: (5, 11)
id: mky6h, df_shape: (6, 11)
id: mqubc, df_shape: (7, 11)
id: 104nq, df_shape: (7, 11)
id: agw49, df_shape: (7, 11)
id: ho895, df_shape: (17, 11)
id: 31le6, df_shape: (4, 11)
id: h10ni, df_shape: (207, 11)
id: lc7b9, df_shape: (26, 11)
id: f2qdr, df_shape: (64, 11)
id: uz8pd, df_shape: (5, 11)
id: u58l6, df_shape: (23, 11)
id: vp231, df_shape: (1, 11)
id: 02c9i, df_shape: (20, 11)
id: sb5ho, df_shape: (6, 11)
id: jhh39, df_shape: (56, 11)
id: d8exy, df_shape: (26, 11)
id: bschi, df_shape: (1, 11)
id: hej9v, df_shape: (3, 11)
id: fouxu, df_shape: (32, 11)
id: z41vn, df_shape: (4, 11)
id: ycyt0, df_shape: (1, 11)
id: 4lmw5, df_shape: (25, 11)
id: zz59x, df_shape: (1, 11)
id: ctso3, df_shape: (1, 11)
id: mqyna, df_shape: (14, 11)
id: xt7bw, df_shape: (1, 11)
id: e3uix, df_shape: (15, 11)
id: 7yzin, df_shape: (1, 11)
id: 6971n, df_shape: (1, 1

id: p7z3n, df_shape: (61, 11)
id: 35cin, df_shape: (140, 11)
id: gh8iq, df_shape: (23, 11)
id: 0dgrn, df_shape: (1, 11)
id: e9p2w, df_shape: (2, 11)
id: fy84j, df_shape: (7, 11)
id: ipmp7, df_shape: (347, 11)
id: kddia, df_shape: (1, 11)
id: 9ps7l, df_shape: (1, 11)
id: wylh4, df_shape: (35, 11)
id: p72pw, df_shape: (13, 11)
id: 5fepo, df_shape: (6, 11)
id: r3mr7, df_shape: (95, 11)
id: ur441, df_shape: (6, 11)
id: 7da7p, df_shape: (1, 11)
id: p0bcc, df_shape: (919, 11)
id: 71tog, df_shape: (99, 11)
id: jrmtt, df_shape: (1, 11)
id: e3wtz, df_shape: (426, 11)
id: tsl3w, df_shape: (5, 11)
id: g5bhy, df_shape: (389, 11)
id: vfi3f, df_shape: (179, 11)
id: lyvj2, df_shape: (2, 11)
id: kojt7, df_shape: (3, 11)
id: 48x7g, df_shape: (158, 11)
id: 0aqcf, df_shape: (8, 11)
id: aq55o, df_shape: (103, 11)
id: todvj, df_shape: (162, 11)
id: xsm97, df_shape: (6, 11)
id: xvfy4, df_shape: (106, 11)
id: knq9b, df_shape: (45, 11)
id: a5qug, df_shape: (116, 11)
id: 4u1xz, df_shape: (24, 11)
id: 9676z, df

id: g6dbu, df_shape: (201, 11)
id: fnq8x, df_shape: (316, 11)
id: t67pq, df_shape: (104, 11)
id: 7gsyp, df_shape: (275, 11)
id: nhzvy, df_shape: (336, 11)
id: f3vhk, df_shape: (283, 11)
id: yxmqu, df_shape: (293, 11)
id: br3vi, df_shape: (12, 11)
id: u4n2h, df_shape: (89, 11)
id: i151o, df_shape: (24, 11)
id: 7jq73, df_shape: (644, 11)
id: fmvcv, df_shape: (88, 11)
id: 6ozff, df_shape: (631, 11)
id: 4pnrc, df_shape: (36, 11)
id: idb3a, df_shape: (8, 11)
id: p7bkw, df_shape: (111, 11)
id: bi6r1, df_shape: (86, 11)
id: vsy1m, df_shape: (19, 11)
id: 79kph, df_shape: (599, 11)
id: 4e2rt, df_shape: (44, 11)
id: r7haq, df_shape: (35, 11)
id: 3ex9l, df_shape: (17, 11)
id: b6850, df_shape: (21, 11)
id: 49dh6, df_shape: (97, 11)
id: 1t3ak, df_shape: (43, 11)
id: o469c, df_shape: (82, 11)
id: mlho1, df_shape: (42, 11)
id: nj6lq, df_shape: (226, 11)
id: 9ne77, df_shape: (13, 11)
id: f24yo, df_shape: (682, 11)
id: 5cuhe, df_shape: (18, 11)
id: nap6q, df_shape: (10, 11)
id: hfcvh, df_shape: (90, 11

id: m5gn3, df_shape: (1, 11)
id: 2sdqq, df_shape: (1, 11)
id: 31i2l, df_shape: (1, 11)
id: 7rs4v, df_shape: (14, 11)
id: v1p2v, df_shape: (12, 11)
id: uz49c, df_shape: (2, 11)
id: ly9nv, df_shape: (6, 11)
id: 61wzx, df_shape: (3, 11)
id: ci7b9, df_shape: (57, 11)
id: zb964, df_shape: (23, 11)
id: ib7bu, df_shape: (23, 11)
id: 4c3mb, df_shape: (21, 11)
id: 1prxi, df_shape: (1, 11)
id: wa146, df_shape: (81, 11)
id: maigg, df_shape: (27, 11)
id: k3m03, df_shape: (20, 11)
id: p5cgl, df_shape: (1, 11)
id: hposk, df_shape: (2, 11)
id: 3w1cj, df_shape: (2, 11)
id: rpt44, df_shape: (2, 11)
id: oijim, df_shape: (14, 11)
id: fwxd6, df_shape: (8, 11)
id: fmi9k, df_shape: (2, 11)
id: k2hn4, df_shape: (1, 11)
id: 33t80, df_shape: (2, 11)
id: 0ihb1, df_shape: (20, 11)
id: rnxkw, df_shape: (11, 11)
id: djm1l, df_shape: (12, 11)
id: 6w0wu, df_shape: (5, 11)
id: o3lyg, df_shape: (2, 11)
id: v3l4n, df_shape: (1, 11)
id: uxrk2, df_shape: (1, 11)
id: 2by4x, df_shape: (6, 11)
id: maytz, df_shape: (1, 11)
i

id: zahli, df_shape: (1, 11)
id: 9gv0e, df_shape: (54, 11)
id: 3ordk, df_shape: (3, 11)
id: 4u8e8, df_shape: (360, 11)
id: v81bi, df_shape: (7, 11)
id: 27ixe, df_shape: (2, 11)
id: vtu2c, df_shape: (68, 11)
id: pu2p9, df_shape: (2, 11)
id: pbx4o, df_shape: (2, 11)
id: fytsc, df_shape: (15, 11)
id: 16czn, df_shape: (2, 11)
id: wmwb9, df_shape: (6, 11)
id: s6s1k, df_shape: (2, 11)
id: xetgj, df_shape: (8, 11)
id: l2b7i, df_shape: (11, 11)
id: oc65c, df_shape: (7, 11)
id: 9pail, df_shape: (3, 11)
id: 9n4zb, df_shape: (11, 11)
id: lk13i, df_shape: (1, 11)
id: 61mas, df_shape: (4, 11)
id: 780hh, df_shape: (8, 11)
id: xfpxi, df_shape: (20, 11)
id: qy591, df_shape: (8, 11)
id: wwcjq, df_shape: (10, 11)
id: zt9ex, df_shape: (1, 11)
id: dj97y, df_shape: (2, 11)
id: n0ty3, df_shape: (2, 11)
id: bunn9, df_shape: (3, 11)
id: anj07, df_shape: (21, 11)
id: n7eu8, df_shape: (37, 11)
id: v5m71, df_shape: (6, 11)
id: 516mc, df_shape: (22, 11)
id: y0lzd, df_shape: (6, 11)
id: 97b3l, df_shape: (63, 11)
i

id: tpdxh, df_shape: (1, 11)
id: px1c4, df_shape: (3, 11)
id: knd4j, df_shape: (6, 11)
id: 5phhv, df_shape: (109, 11)
id: 6p1u3, df_shape: (2, 11)
id: hkd9l, df_shape: (14, 11)
id: w0qzh, df_shape: (7, 11)
id: e57jy, df_shape: (2, 11)
id: vmfnf, df_shape: (2, 11)
id: wqij9, df_shape: (7, 11)
id: n18ov, df_shape: (1, 11)
id: ss0ji, df_shape: (1, 11)
id: znhmr, df_shape: (10, 11)
id: chcmg, df_shape: (2, 11)
id: 7zgbz, df_shape: (1, 11)
id: y2pgm, df_shape: (6, 11)
id: somnq, df_shape: (2, 11)
id: gediy, df_shape: (4, 11)
id: 62yba, df_shape: (1, 11)
id: yffnx, df_shape: (3, 11)
id: vql1d, df_shape: (1, 11)
id: b36x2, df_shape: (2, 11)
id: ohm8w, df_shape: (2, 11)
id: j3975, df_shape: (6, 11)
id: 7nedy, df_shape: (62, 11)
id: z64n3, df_shape: (80, 11)
id: wsexe, df_shape: (4, 11)
id: hpqjd, df_shape: (21, 11)
id: s34ji, df_shape: (8, 11)
id: bv8jc, df_shape: (1, 11)
id: j1zp0, df_shape: (1, 11)
id: s1qqh, df_shape: (26, 11)
id: lcido, df_shape: (87, 11)
id: uanjc, df_shape: (25, 11)
id: 

id: 4hbfo, df_shape: (2, 11)
id: hrhiq, df_shape: (1, 11)
id: difx2, df_shape: (2, 11)
id: v8guk, df_shape: (1, 11)
id: 6uzlu, df_shape: (3, 11)
id: uscoi, df_shape: (2, 11)
id: vpt9v, df_shape: (8, 11)
id: ams7k, df_shape: (1, 11)
id: 9ot94, df_shape: (1, 11)
id: 1phco, df_shape: (3, 11)
id: lpade, df_shape: (3, 11)
id: 9v7tn, df_shape: (1, 11)
id: 69lj3, df_shape: (2, 11)
id: 3mh2u, df_shape: (2, 11)
id: rpzb9, df_shape: (10, 11)
id: lhxd8, df_shape: (1, 11)
id: ajy3t, df_shape: (1, 11)
id: a59py, df_shape: (3, 11)
id: 8g7ln, df_shape: (1, 11)
id: tq6eu, df_shape: (3, 11)
id: qbnaa, df_shape: (1, 11)
id: k0f32, df_shape: (1, 11)
id: kjiju, df_shape: (1, 11)
id: uxg9n, df_shape: (1, 11)
id: m9d4c, df_shape: (5, 11)
id: 8aolm, df_shape: (16, 11)
id: wmya0, df_shape: (39, 11)
id: dlnia, df_shape: (3, 11)
id: r9gpw, df_shape: (2, 11)
id: saqyk, df_shape: (2, 11)
id: 8ck94, df_shape: (5, 11)
id: x9suu, df_shape: (5, 11)
id: d93aq, df_shape: (1, 11)
id: kv8i8, df_shape: (4, 11)
id: fx20k, 

id: aslcx, df_shape: (4096, 11)
id: pqfbq, df_shape: (6457, 11)
id: aiywh, df_shape: (1564, 11)
id: aqswk, df_shape: (3548, 11)
id: fce2e, df_shape: (322, 11)
id: lsjsi, df_shape: (280, 11)
id: eymbx, df_shape: (215, 11)
id: z1iuy, df_shape: (21, 11)
id: zfjly, df_shape: (399, 11)
id: enf1x, df_shape: (42180, 11)
id: gox6f, df_shape: (328, 11)
id: efqf6, df_shape: (1285, 11)
id: ca1cz, df_shape: (1033, 11)
id: h23sy, df_shape: (21130, 11)
id: mz5di, df_shape: (47, 11)
id: 8en3h, df_shape: (6897, 11)
id: zz2zx, df_shape: (2403, 11)
id: uotsf, df_shape: (4005, 11)
id: hy5xd, df_shape: (5436, 11)
id: x8et8, df_shape: (2085, 11)
id: q4piy, df_shape: (1220, 11)
id: gst86, df_shape: (13190, 11)
id: dct7l, df_shape: (2902, 11)
id: mwws3, df_shape: (1281, 11)
id: lwgcc, df_shape: (9777, 11)
id: foo8f, df_shape: (1038, 11)
id: gja6c, df_shape: (12887, 11)
id: strbn, df_shape: (12810, 11)
id: 53qgu, df_shape: (291, 11)
id: 7brna, df_shape: (48, 11)
id: a67ry, df_shape: (163, 11)
id: 1ftck, df_sh

id: mtqvy, df_shape: (1228, 11)
id: hy3o6, df_shape: (119, 11)
id: irea8, df_shape: (3871, 11)
id: gddn2, df_shape: (607, 11)
id: b8j2z, df_shape: (8, 11)
id: 0y87g, df_shape: (385, 11)
id: ejyqb, df_shape: (3932, 11)
id: 7cqns, df_shape: (61, 11)
id: ensr9, df_shape: (136, 11)
id: k8cn3, df_shape: (63, 11)
id: o4oi7, df_shape: (9, 11)
id: 8wi2r, df_shape: (3084, 11)
id: 8xzwp, df_shape: (21, 11)
id: ucvo3, df_shape: (2819, 11)
id: lus5z, df_shape: (71, 11)
id: jjx15, df_shape: (86, 11)
id: dzngb, df_shape: (806, 11)
id: 0pc20, df_shape: (205, 11)
id: s8ys6, df_shape: (15618, 11)
id: 80vbf, df_shape: (1606, 11)
id: p907j, df_shape: (11, 11)
id: r98e0, df_shape: (109, 11)
id: qzqi5, df_shape: (119, 11)
id: qi62d, df_shape: (1110, 11)
id: 5ko0v, df_shape: (439, 11)
id: 741dd, df_shape: (196, 11)
id: g0ecv, df_shape: (1391, 11)
id: p98sh, df_shape: (6, 11)
id: sm0bp, df_shape: (2634, 11)
id: 7qncv, df_shape: (1146, 11)
id: 6423j, df_shape: (183, 11)
id: 08u1f, df_shape: (954, 11)
id: i1zt

id: bqcl3, df_shape: (665, 11)
id: xho5b, df_shape: (2122, 11)
id: 8499y, df_shape: (21, 11)
id: qlhl9, df_shape: (137, 11)
id: v772u, df_shape: (4443, 11)
id: 19emd, df_shape: (441, 11)
id: 58bkb, df_shape: (98, 11)
id: k3j8s, df_shape: (31, 11)
id: 8ce52, df_shape: (63, 11)
id: oxo9k, df_shape: (16, 11)
id: cq2rl, df_shape: (239, 11)
id: a75lx, df_shape: (638, 11)
id: sj68n, df_shape: (294, 11)
id: l3fp5, df_shape: (737, 11)
id: 17a0y, df_shape: (392, 11)
id: 8e6c7, df_shape: (5, 11)
id: twh2g, df_shape: (273, 11)
id: thcf2, df_shape: (107, 11)
id: 3rj7m, df_shape: (440, 11)
id: 6f3t4, df_shape: (555, 11)
id: ggqyk, df_shape: (72, 11)
id: 9vtnd, df_shape: (82, 11)
id: jcwt7, df_shape: (213, 11)
id: oav3x, df_shape: (36, 11)
id: f9jfi, df_shape: (41, 11)
id: 2n3xc, df_shape: (394, 11)
id: qw7df, df_shape: (591, 11)
id: edanb, df_shape: (1030, 11)
id: wd2hx, df_shape: (194, 11)
id: h1a1o, df_shape: (120, 11)
id: fwxlx, df_shape: (53, 11)
id: 8py1p, df_shape: (254, 11)
id: rcb25, df_sha

id: ypys3, df_shape: (30, 11)
id: yikqp, df_shape: (106, 11)
id: n1xyl, df_shape: (111, 11)
id: zmrzi, df_shape: (8, 11)
id: aqnq0, df_shape: (490, 11)
id: y7ads, df_shape: (442, 11)
id: yp5qm, df_shape: (63, 11)
id: zurpm, df_shape: (189, 11)
id: tmhm3, df_shape: (568, 11)
id: 3fma4, df_shape: (41, 11)
id: x9e41, df_shape: (99, 11)
id: u0sd0, df_shape: (542, 11)
id: l435t, df_shape: (580, 11)
id: 52bm2, df_shape: (178, 11)
id: mzy59, df_shape: (126, 11)
id: 42yv7, df_shape: (16, 11)
id: w9ybh, df_shape: (156, 11)
id: nuwwt, df_shape: (302, 11)
id: linu5, df_shape: (336, 11)
id: g6vpc, df_shape: (29, 11)
id: 5gci2, df_shape: (36, 11)
id: awusm, df_shape: (68, 11)
id: io44s, df_shape: (119, 11)
id: kvykx, df_shape: (444, 11)
id: q1pgh, df_shape: (16, 11)
id: ejd3n, df_shape: (936, 11)
id: 22mr6, df_shape: (21, 11)
id: h2oji, df_shape: (351, 11)
id: xro6r, df_shape: (8, 11)
id: 3xoj9, df_shape: (2, 11)
id: g8dp9, df_shape: (315, 11)
id: 2bbls, df_shape: (51, 11)
id: g528r, df_shape: (39,

id: go4ub, df_shape: (73, 11)
id: hdifv, df_shape: (33, 11)
id: wvwsh, df_shape: (5, 11)
id: ufgps, df_shape: (356, 11)
id: h0o7n, df_shape: (14, 11)
id: n2xg9, df_shape: (15, 11)
id: d4r41, df_shape: (8, 11)
id: 35q08, df_shape: (18, 11)
id: 2tlh7, df_shape: (301, 11)
id: nytgy, df_shape: (1, 11)
id: moftl, df_shape: (114, 11)
id: qt9nr, df_shape: (295, 11)
id: lwbzh, df_shape: (78, 11)
id: pb51b, df_shape: (76, 11)
id: 8lhtb, df_shape: (79, 11)
id: 0kr34, df_shape: (64, 11)
id: n402p, df_shape: (37, 11)
id: b6q1c, df_shape: (113, 11)
id: 44psq, df_shape: (39, 11)
id: 4szy8, df_shape: (4, 11)
id: vfcq6, df_shape: (207, 11)
id: z51fk, df_shape: (352, 11)
id: diwlw, df_shape: (54, 11)
id: 9wotz, df_shape: (161, 11)
id: 8gshg, df_shape: (130, 11)
id: rznl6, df_shape: (68, 11)
id: 1l09i, df_shape: (57, 11)
id: fx30k, df_shape: (49, 11)
id: v6l8w, df_shape: (32, 11)
id: vlycu, df_shape: (18, 11)
id: run9d, df_shape: (41, 11)
id: w6e0q, df_shape: (33, 11)
id: 0xonb, df_shape: (5, 11)
id: 8t

id: 958lf, df_shape: (498, 11)
id: mygxa, df_shape: (46, 11)
id: t6mn6, df_shape: (132, 11)
id: san5r, df_shape: (14, 11)
id: ytur6, df_shape: (328, 11)
id: fjcao, df_shape: (361, 11)
id: k5e1s, df_shape: (407, 11)
id: dg7ya, df_shape: (9, 11)
id: xhpy1, df_shape: (20, 11)
id: j84o7, df_shape: (59, 11)
id: 6nkm2, df_shape: (94, 11)
id: s0n3y, df_shape: (6, 11)
id: yh5qn, df_shape: (149, 11)
id: tngtf, df_shape: (408, 11)
id: hf4p5, df_shape: (3, 11)
id: nv0hh, df_shape: (116, 11)
id: gf0f6, df_shape: (17, 11)
id: 63gpe, df_shape: (47, 11)
id: 6b4b8, df_shape: (290, 11)
id: oiosd, df_shape: (1, 11)
id: f3ygp, df_shape: (21, 11)
id: ig4os, df_shape: (2658, 11)
id: 15hbf, df_shape: (24, 11)
id: splwk, df_shape: (34, 11)
id: nambt, df_shape: (5, 11)
id: t7uyz, df_shape: (78, 11)
id: xfxjf, df_shape: (74, 11)
id: jh92x, df_shape: (27, 11)
id: ge1wd, df_shape: (64, 11)
id: g6oi9, df_shape: (430, 11)
id: 0kkin, df_shape: (56, 11)
id: m786c, df_shape: (2, 11)
id: 9f4p0, df_shape: (105, 11)
id:

id: po4n1, df_shape: (4, 11)
id: m8n5a, df_shape: (6, 11)
id: ibqdz, df_shape: (122, 11)
id: wg73a, df_shape: (3, 11)
id: shhpd, df_shape: (9, 11)
id: xj556, df_shape: (64, 11)
id: foiao, df_shape: (144, 11)
id: 8ma79, df_shape: (35, 11)
id: fgbzp, df_shape: (36, 11)
id: zr1t0, df_shape: (50, 11)
id: 07p79, df_shape: (13, 11)
id: e3nxu, df_shape: (65, 11)
id: dx3kc, df_shape: (29, 11)
id: 4aohx, df_shape: (51, 11)
id: 83z5c, df_shape: (40, 11)
id: h4mjg, df_shape: (44, 11)
id: nrtf5, df_shape: (61, 11)
id: 6zw9u, df_shape: (7, 11)
id: wob7w, df_shape: (42, 11)
id: cchc0, df_shape: (34, 11)
id: tx9ho, df_shape: (7, 11)
id: 7vamn, df_shape: (1, 11)
id: zd902, df_shape: (7, 11)
id: i2guh, df_shape: (3, 11)
id: i42eg, df_shape: (47, 11)
id: bza6u, df_shape: (28, 11)
id: s7gwr, df_shape: (4, 11)
id: pno54, df_shape: (1, 11)
id: w7j8i, df_shape: (135, 11)
id: 6pvhb, df_shape: (4, 11)
id: ybdkf, df_shape: (63, 11)
id: h709i, df_shape: (33, 11)
id: esjfd, df_shape: (12, 11)
id: 8zaqx, df_shape

id: h6vxy, df_shape: (14, 11)
id: wcijx, df_shape: (107, 11)
id: sg3yo, df_shape: (61, 11)
id: pt2in, df_shape: (150, 11)
id: 6swh5, df_shape: (111, 11)
id: dvllu, df_shape: (825, 11)
id: 02ubh, df_shape: (26, 11)
id: l5eoj, df_shape: (13, 11)
id: hjl8g, df_shape: (36, 11)
id: zpet6, df_shape: (8, 11)
id: pwx45, df_shape: (60, 11)
id: xn0y0, df_shape: (5129, 11)
id: s1k57, df_shape: (27, 11)
id: ekmqy, df_shape: (36, 11)
id: sn980, df_shape: (10, 11)
id: nyasr, df_shape: (168, 11)
id: ujhch, df_shape: (51, 11)
id: n17ul, df_shape: (69, 11)
id: apra3, df_shape: (2, 11)
id: onhde, df_shape: (217, 11)
id: a478a, df_shape: (76, 11)
id: 9uha0, df_shape: (3, 11)
id: drbf2, df_shape: (654, 11)
id: nweau, df_shape: (156, 11)
id: ahp4j, df_shape: (68, 11)
id: kfiod, df_shape: (482, 11)
id: dyeel, df_shape: (34, 11)
id: egst6, df_shape: (1225, 11)
id: wk9cq, df_shape: (5, 11)
id: mlyy4, df_shape: (359, 11)
id: 7ig70, df_shape: (5, 11)
id: dvnw7, df_shape: (4, 11)
id: rk1nk, df_shape: (8, 11)
id:

id: rliyb, df_shape: (80, 11)
id: q1beh, df_shape: (30, 11)
id: qmfaj, df_shape: (8, 11)
id: fky7u, df_shape: (13, 11)
id: obm1n, df_shape: (103, 11)
id: rr8xe, df_shape: (61, 11)
id: 63lzy, df_shape: (2211, 11)
id: 6ddq7, df_shape: (139, 11)
id: k8ylf, df_shape: (2365, 11)
id: 7sqmh, df_shape: (1029, 11)
id: 09hjf, df_shape: (91, 11)
id: 2h4ar, df_shape: (65, 11)
id: fqzp6, df_shape: (10, 11)
id: ek230, df_shape: (3, 11)
id: tjbxy, df_shape: (7, 11)
id: l8p0t, df_shape: (12, 11)
id: rbi4i, df_shape: (6, 11)
id: 3ibfj, df_shape: (8, 11)
id: uffaq, df_shape: (130, 11)
id: 1mykd, df_shape: (21, 11)
id: iykxb, df_shape: (4, 11)
id: vtmyu, df_shape: (57, 11)
id: txxgt, df_shape: (149, 11)
id: lffzm, df_shape: (63, 11)
id: j1n99, df_shape: (3, 11)
id: ums3h, df_shape: (402, 11)
id: h581f, df_shape: (3, 11)
id: qu1ny, df_shape: (15, 11)
id: nkvze, df_shape: (17, 11)
id: f6klr, df_shape: (238, 11)
id: orfqu, df_shape: (17, 11)
id: nc4im, df_shape: (20, 11)
id: jtna5, df_shape: (377, 11)
id: e

id: goa6o, df_shape: (2199, 11)
id: nruvi, df_shape: (753, 11)
id: fa64r, df_shape: (97, 11)
id: uv790, df_shape: (10, 11)
id: xpkam, df_shape: (139, 11)
id: s2sf4, df_shape: (4, 11)
id: 0u6ql, df_shape: (230, 11)
id: hqd8e, df_shape: (64, 11)
id: i024c, df_shape: (462, 11)
id: hm94p, df_shape: (121, 11)
id: 9wv9o, df_shape: (17, 11)
id: 49mha, df_shape: (6, 11)
id: 1wcp8, df_shape: (127, 11)
id: 0ef34, df_shape: (632, 11)
id: 377io, df_shape: (78, 11)
id: 2zr59, df_shape: (1, 11)
id: 5sssg, df_shape: (31, 11)
id: qfju8, df_shape: (23, 11)
id: kpast, df_shape: (59, 11)
id: 15cms, df_shape: (412, 11)
id: gidpp, df_shape: (421, 11)
id: knakj, df_shape: (147, 11)
id: zgyrr, df_shape: (323, 11)
id: 5h7dw, df_shape: (40, 11)
id: qe4te, df_shape: (618, 11)
id: ga10e, df_shape: (6, 11)
id: g2bvb, df_shape: (490, 11)
id: bvu6v, df_shape: (365, 11)
id: z971k, df_shape: (11, 11)
id: qipzz, df_shape: (589, 11)
id: fr3kh, df_shape: (327, 11)
id: a80g3, df_shape: (360, 11)
id: akp6h, df_shape: (30,

id: ofa24, df_shape: (251, 11)
id: mdbii, df_shape: (2, 11)
id: feuyx, df_shape: (323, 11)
id: 5eddt, df_shape: (88, 11)
id: obts3, df_shape: (162, 11)
id: 9iayu, df_shape: (335, 11)
id: ipdmo, df_shape: (242, 11)
id: j4azq, df_shape: (6, 11)
id: lw44y, df_shape: (360, 11)
id: 10zxz, df_shape: (28, 11)
id: rjqk0, df_shape: (83, 11)
id: rk3am, df_shape: (155, 11)
id: c2t3v, df_shape: (105, 11)
id: mmmhw, df_shape: (1, 11)
id: gxdo2, df_shape: (15, 11)
id: k4ucl, df_shape: (26, 11)
id: zj05b, df_shape: (3, 11)
id: izc3e, df_shape: (6, 11)
id: e0cnb, df_shape: (15, 11)
id: phgwj, df_shape: (3, 11)
id: kcp09, df_shape: (2, 11)
id: 8380x, df_shape: (48, 11)
id: 5l79f, df_shape: (101, 11)
id: hs26g, df_shape: (1, 11)
id: 0y20x, df_shape: (45, 11)
id: 9xkhm, df_shape: (2, 11)
id: 9ars3, df_shape: (4, 11)
id: 6txma, df_shape: (843, 11)
id: a2cr7, df_shape: (45, 11)
id: vhmlk, df_shape: (8, 11)
id: 5jfb6, df_shape: (1, 11)
id: n6fg8, df_shape: (141, 11)
id: 6rrbv, df_shape: (74, 11)
id: x8dpy, 

id: 39zoz, df_shape: (56, 11)
id: 96kfk, df_shape: (29, 11)
id: psudh, df_shape: (107, 11)
id: 7hzsc, df_shape: (1061, 11)
id: pd58b, df_shape: (15, 11)
id: 0q8ac, df_shape: (909, 11)
id: ugmhd, df_shape: (126, 11)
id: xebep, df_shape: (67, 11)
id: kudli, df_shape: (83, 11)
id: v1el8, df_shape: (5, 11)
id: 0k63p, df_shape: (15, 11)
id: 55sgd, df_shape: (51, 11)
id: uirns, df_shape: (1869, 11)
id: 3i7d9, df_shape: (71, 11)
id: ixnkd, df_shape: (17, 11)
id: shv7g, df_shape: (163, 11)
id: yww90, df_shape: (8, 11)
id: wm9nb, df_shape: (103, 11)
id: 7qv75, df_shape: (38, 11)
id: dm5d1, df_shape: (377, 11)
id: jmf5l, df_shape: (101, 11)
id: uoyt7, df_shape: (590, 11)
id: nvq17, df_shape: (293, 11)
id: pjhd9, df_shape: (240, 11)
id: qga09, df_shape: (1459, 11)
id: jzwu0, df_shape: (202, 11)
id: opude, df_shape: (465, 11)
id: zq69v, df_shape: (451, 11)
id: ymwky, df_shape: (289, 11)
id: 6baq7, df_shape: (133, 11)
id: r5dty, df_shape: (210, 11)
id: bzncd, df_shape: (211, 11)
id: eotxd, df_shape

id: razqd, df_shape: (4, 11)
id: 2pvlr, df_shape: (1, 11)
id: rr1s7, df_shape: (21, 11)
id: 1rhkc, df_shape: (14, 11)
id: g75xd, df_shape: (116, 11)
id: a1swj, df_shape: (4, 11)
id: s074e, df_shape: (24, 11)
id: j2d27, df_shape: (53, 11)
id: gpyyh, df_shape: (147, 11)
id: a64zd, df_shape: (10, 11)
id: qzefl, df_shape: (23, 11)
id: 42887, df_shape: (58, 11)
id: mmgbq, df_shape: (131, 11)
id: mf40s, df_shape: (5, 11)
id: gwwzk, df_shape: (85, 11)
id: 2f49v, df_shape: (32, 11)
id: tsgo0, df_shape: (129, 11)
id: 30jdh, df_shape: (20, 11)
id: i297h, df_shape: (113, 11)
id: amuwu, df_shape: (39, 11)
id: pudtc, df_shape: (116, 11)
id: xr5uz, df_shape: (942, 11)
id: aioij, df_shape: (11, 11)
id: e6mrf, df_shape: (6, 11)
id: j1e00, df_shape: (4, 11)
id: vuqd1, df_shape: (25, 11)
id: es3kc, df_shape: (11, 11)
id: mhd2x, df_shape: (25, 11)
id: um31v, df_shape: (19, 11)
id: 8osdn, df_shape: (23, 11)
id: hj8j0, df_shape: (370, 11)
id: af3ni, df_shape: (4, 11)
id: z2lp7, df_shape: (80, 11)
id: 5nn1v

id: zlmi4, df_shape: (26, 11)
id: kbfgd, df_shape: (15, 11)
id: e8vdj, df_shape: (6, 11)
id: xhmge, df_shape: (8, 11)
id: 8khcv, df_shape: (95, 11)
id: 7b9jg, df_shape: (22, 11)
id: 36pbn, df_shape: (6, 11)
id: xw0lt, df_shape: (7, 11)
id: ebdjg, df_shape: (7, 11)
id: faxz5, df_shape: (11, 11)
id: oovpg, df_shape: (8, 11)
id: i4qyw, df_shape: (4, 11)
id: 2t9eo, df_shape: (1, 11)
id: ux0ov, df_shape: (2, 11)
id: u0rwf, df_shape: (1, 11)
id: c0wi0, df_shape: (13, 11)
id: qfq8l, df_shape: (177, 11)
id: ndprt, df_shape: (3, 11)
id: faldg, df_shape: (7, 11)
id: 2b1wq, df_shape: (400, 11)
id: z7b8k, df_shape: (1, 11)
id: bo17h, df_shape: (1, 11)
id: l2rpu, df_shape: (120, 11)
id: iewnq, df_shape: (8, 11)
id: vk2v6, df_shape: (129, 11)
id: 1q2mp, df_shape: (58, 11)
id: l48yf, df_shape: (12, 11)
id: vonm3, df_shape: (2, 11)
id: 14lmx, df_shape: (2, 11)
id: oerpi, df_shape: (11, 11)
id: 16j4e, df_shape: (14, 11)
id: egghr, df_shape: (3, 11)
id: b1fe8, df_shape: (13, 11)
id: 31ggk, df_shape: (55

id: 7noeq, df_shape: (600, 11)
id: 1lxsk, df_shape: (170, 11)
id: cn4k4, df_shape: (999, 11)
id: xxzjn, df_shape: (1691, 11)
id: 6r8zk, df_shape: (66, 11)
id: gzzks, df_shape: (174, 11)
id: 5id7j, df_shape: (355, 11)
id: rn6ir, df_shape: (62, 11)
id: lqa0n, df_shape: (551, 11)
id: 64kx3, df_shape: (56, 11)
id: r4a9h, df_shape: (85, 11)
id: aw1m4, df_shape: (9, 11)
id: gwob3, df_shape: (63, 11)
id: ri8ni, df_shape: (158, 11)
id: x7mge, df_shape: (523, 11)
id: 18nth, df_shape: (2065, 11)
id: rw47l, df_shape: (41, 11)
id: jt2m8, df_shape: (164, 11)
id: fsbi2, df_shape: (349, 11)
id: 8f75q, df_shape: (12, 11)
id: slgg9, df_shape: (83, 11)
id: fsqsp, df_shape: (3, 11)
id: 34mps, df_shape: (1051, 11)
id: g6w6r, df_shape: (49, 11)
id: snijl, df_shape: (44, 11)
id: gxptf, df_shape: (27, 11)
id: 1cbiu, df_shape: (1609, 11)
id: sdve3, df_shape: (12, 11)
id: zcuuc, df_shape: (201, 11)
id: 8advj, df_shape: (23, 11)
id: ro7gn, df_shape: (4, 11)
id: 45m4f, df_shape: (19, 11)
id: 89xye, df_shape: (15

id: 75f7v, df_shape: (43, 11)
id: xkxv3, df_shape: (321, 11)
id: pqjs4, df_shape: (183, 11)
id: uk2gn, df_shape: (236, 11)
id: ffx97, df_shape: (52, 11)
id: 0dm6m, df_shape: (31, 11)
id: 2udn9, df_shape: (14, 11)
id: ryso3, df_shape: (64, 11)
id: us5g1, df_shape: (14, 11)
id: 0mdgt, df_shape: (717, 11)
id: mndls, df_shape: (263, 11)
id: 6ajnk, df_shape: (80, 11)
id: hdghi, df_shape: (106, 11)
id: ti510, df_shape: (5, 11)
id: nu8ru, df_shape: (58, 11)
id: z8802, df_shape: (55, 11)
id: fw28c, df_shape: (37, 11)
id: i9ryp, df_shape: (39, 11)
id: dxbe7, df_shape: (65, 11)
id: zwqah, df_shape: (43, 11)
id: p2zwg, df_shape: (37, 11)
id: 532t4, df_shape: (5, 11)
id: flfxq, df_shape: (37, 11)
id: jtbzp, df_shape: (80, 11)
id: qj82o, df_shape: (56, 11)
id: bg1xc, df_shape: (1387, 11)
id: oco8q, df_shape: (308, 11)
id: p5892, df_shape: (11, 11)
id: mub7g, df_shape: (78, 11)
id: wdr5u, df_shape: (20, 11)
id: ueglr, df_shape: (56, 11)
id: 38phk, df_shape: (70, 11)
id: 3ca8f, df_shape: (13, 11)
id:

id: rnfgn, df_shape: (6, 11)
id: o2iim, df_shape: (8, 11)
id: 8w1pz, df_shape: (7, 11)
id: b4q07, df_shape: (1, 11)
id: 13kbi, df_shape: (11, 11)
id: p9i74, df_shape: (3, 11)
id: ogd9g, df_shape: (4, 11)
id: c4ytj, df_shape: (35, 11)
id: mrha8, df_shape: (20, 11)
id: 9gfkc, df_shape: (75, 11)
id: 4smkb, df_shape: (25, 11)
id: gz4s6, df_shape: (33, 11)
id: wex35, df_shape: (55, 11)
id: 8akx1, df_shape: (11, 11)
id: wvwl4, df_shape: (17, 11)
id: gwshe, df_shape: (2, 11)
id: smx0t, df_shape: (1, 11)
id: kq5a1, df_shape: (6, 11)
id: gai7f, df_shape: (10, 11)
id: es5a0, df_shape: (27, 11)
id: zz2r1, df_shape: (69, 11)
id: z09mu, df_shape: (24, 11)
id: evqlu, df_shape: (104, 11)
id: mq84j, df_shape: (1, 11)
id: soyrb, df_shape: (1, 11)
id: 76rpm, df_shape: (12, 11)
id: j8xgh, df_shape: (27, 11)
id: 4wbx3, df_shape: (57, 11)
id: 33p2a, df_shape: (818, 11)
id: 11rf1, df_shape: (8, 11)
id: a9v97, df_shape: (84, 11)
id: 7sfhp, df_shape: (58, 11)
id: z285o, df_shape: (10, 11)
id: ocz8s, df_shape:

id: m7pi4, df_shape: (1, 11)
id: u9gsl, df_shape: (2, 11)
id: sr9vw, df_shape: (40, 11)
id: 26esw, df_shape: (1, 11)
id: 08wsg, df_shape: (6, 11)
id: vijsj, df_shape: (126, 11)
id: tusaa, df_shape: (13, 11)
id: 30n9g, df_shape: (70, 11)
id: flslr, df_shape: (35, 11)
id: 5w3lk, df_shape: (20, 11)
id: vjpu7, df_shape: (16, 11)
id: zbohz, df_shape: (3, 11)
id: z0z2m, df_shape: (1, 11)
id: 5vlfc, df_shape: (7, 11)
id: qhllq, df_shape: (6, 11)
id: 79kb3, df_shape: (7, 11)
id: vlmwi, df_shape: (7, 11)
id: sxthd, df_shape: (11, 11)
id: 8suk9, df_shape: (5, 11)
id: cnfkg, df_shape: (97, 11)
id: gjkss, df_shape: (1, 11)
id: igx27, df_shape: (3, 11)
id: 7t0q1, df_shape: (15, 11)
id: 2bzr0, df_shape: (3, 11)
id: w8dq5, df_shape: (4, 11)
id: ijcyy, df_shape: (9, 11)
id: esjjc, df_shape: (15, 11)
id: 3kn4y, df_shape: (2, 11)
id: m946j, df_shape: (9, 11)
id: i01xm, df_shape: (3, 11)
id: gq1zf, df_shape: (102, 11)
id: f6rj3, df_shape: (6, 11)
id: ysaa6, df_shape: (9, 11)
id: t9958, df_shape: (33, 11)

id: 8abt3, df_shape: (2, 11)
id: eg4i1, df_shape: (224, 11)
id: 4lwwb, df_shape: (1, 11)
id: 209ix, df_shape: (498, 11)
id: 73alw, df_shape: (3, 11)
id: zn8qm, df_shape: (4, 11)
id: jbhtn, df_shape: (58, 11)
id: eb7uq, df_shape: (22, 11)
id: fexar, df_shape: (8, 11)
id: 4o9t8, df_shape: (46, 11)
id: u6jvr, df_shape: (2, 11)
id: i1kwk, df_shape: (16, 11)
id: v5gwc, df_shape: (1, 11)
id: v7y8z, df_shape: (2, 11)
id: o5t8l, df_shape: (36, 11)
id: qpxkt, df_shape: (108, 11)
id: 2jffg, df_shape: (2, 11)
id: ta9nh, df_shape: (9, 11)
id: oezt7, df_shape: (413, 11)
id: zle48, df_shape: (5, 11)
id: i1bpi, df_shape: (2, 11)
id: oqz76, df_shape: (1, 11)
id: 0kr63, df_shape: (9, 11)
id: j1aql, df_shape: (1, 11)
id: h9kui, df_shape: (22, 11)
id: 22ckt, df_shape: (219, 11)
id: c24jt, df_shape: (20, 11)
id: exkvk, df_shape: (127, 11)
id: cjx5x, df_shape: (2, 11)
id: mvxe5, df_shape: (2, 11)
id: 0leo6, df_shape: (49, 11)
id: x0ws4, df_shape: (1, 11)
id: ut42l, df_shape: (17, 11)
id: 1j0uj, df_shape: (

id: hoqmd, df_shape: (1, 11)
id: ktgq5, df_shape: (5, 11)
id: nfntk, df_shape: (17, 11)
id: iiy9k, df_shape: (11, 11)
id: ffowb, df_shape: (18, 11)
id: qjhoa, df_shape: (11, 11)
id: pa0rh, df_shape: (30, 11)
id: vr9pf, df_shape: (25, 11)
id: 3u4o6, df_shape: (4, 11)
id: 472i2, df_shape: (6, 11)
id: i84z1, df_shape: (9, 11)
id: rmlu1, df_shape: (1, 11)
id: bo9ey, df_shape: (143, 11)
id: emm20, df_shape: (48, 11)
id: ckvro, df_shape: (3, 11)
id: 8b06o, df_shape: (28, 11)
id: s3byk, df_shape: (25, 11)
id: 3ng3k, df_shape: (45, 11)
id: nth97, df_shape: (19, 11)
id: r6lqf, df_shape: (51, 11)
id: zp8rt, df_shape: (2, 11)
id: 3ax98, df_shape: (1, 11)
id: n6pf3, df_shape: (9, 11)
id: x4n84, df_shape: (117, 11)
id: hvx7x, df_shape: (1, 11)
id: raqlf, df_shape: (25, 11)
id: kokd6, df_shape: (2, 11)
id: klnv5, df_shape: (6, 11)
id: o6dg6, df_shape: (3, 11)
id: 552rz, df_shape: (141, 11)
id: 8ywtc, df_shape: (13, 11)
id: uv29c, df_shape: (2, 11)
id: 1gk1b, df_shape: (9, 11)
id: 33j0n, df_shape: (3

id: f29cn, df_shape: (13, 11)
id: 12woo, df_shape: (3, 11)
id: a06bm, df_shape: (4, 11)
id: m3b4r, df_shape: (1, 11)
id: 09wll, df_shape: (1, 11)
id: jxq9v, df_shape: (31, 11)
id: ybat3, df_shape: (26, 11)
id: z6x1f, df_shape: (10, 11)
id: r9lhv, df_shape: (2, 11)
id: gzy7r, df_shape: (2, 11)
id: abx1x, df_shape: (5, 11)
id: 80fpl, df_shape: (1, 11)
id: 3xwmb, df_shape: (6, 11)
id: w943b, df_shape: (247, 11)
id: o669n, df_shape: (4, 11)
id: 8laun, df_shape: (3, 11)
id: g2qrd, df_shape: (7, 11)
id: agqzd, df_shape: (17, 11)
id: b2454, df_shape: (8, 11)
id: p1lop, df_shape: (3681, 11)
id: mgd7p, df_shape: (70, 11)
id: g97i9, df_shape: (94, 11)
id: 60jh8, df_shape: (112, 11)
id: k2h7k, df_shape: (494, 11)
id: 8p2zj, df_shape: (74, 11)
id: 1378d, df_shape: (104, 11)
id: f70nu, df_shape: (1, 11)
id: czhtz, df_shape: (1, 11)
id: yc3ve, df_shape: (8, 11)
id: 1ay6c, df_shape: (8, 11)
id: 6lvrx, df_shape: (9, 11)
id: zm0jf, df_shape: (7, 11)
id: sjs74, df_shape: (1, 11)
id: un4gz, df_shape: (56

id: bq24m, df_shape: (2, 11)
id: p99ju, df_shape: (1, 11)
id: fzrp2, df_shape: (116, 11)
id: 70m6x, df_shape: (64, 11)
id: icbes, df_shape: (11, 11)
id: 03ou3, df_shape: (153, 11)
id: dmuja, df_shape: (8, 11)
id: 2vm3i, df_shape: (8, 11)
id: 59jq8, df_shape: (16, 11)
id: z4ox4, df_shape: (2, 11)
id: iawgq, df_shape: (22, 11)
id: e7tpm, df_shape: (106, 11)
id: lbev8, df_shape: (3, 11)
id: 1seb3, df_shape: (47, 11)
id: 2sdhn, df_shape: (2, 11)
id: ck1ac, df_shape: (1, 11)
id: xb9uo, df_shape: (155, 11)
id: zhr0p, df_shape: (2, 11)
id: esio3, df_shape: (4, 11)
id: mbh7p, df_shape: (16, 11)
id: 686ad, df_shape: (6, 11)
id: pvmaz, df_shape: (123, 11)
id: cr2qq, df_shape: (7, 11)
id: izhzc, df_shape: (1, 11)
id: jg06f, df_shape: (5, 11)
id: n91wz, df_shape: (74, 11)
id: zkb6z, df_shape: (7, 11)
id: 5hzoe, df_shape: (1, 11)
id: p3vbc, df_shape: (2, 11)
id: qkwvg, df_shape: (40, 11)
id: w1jmm, df_shape: (7, 11)
id: z8av7, df_shape: (13, 11)
id: 9bhxl, df_shape: (25, 11)
id: bde7q, df_shape: (6

id: i3e7z, df_shape: (53, 11)
id: 9p9vr, df_shape: (37, 11)
id: bkv1k, df_shape: (34, 11)
id: 1gvgi, df_shape: (47, 11)
id: e7qzd, df_shape: (2, 11)
id: usmc2, df_shape: (13, 11)
id: x39bn, df_shape: (22, 11)
id: j39p0, df_shape: (20, 11)
id: tduy8, df_shape: (24, 11)
id: nr2hj, df_shape: (1, 11)
id: yhyyn, df_shape: (52, 11)
id: 3s5iv, df_shape: (7, 11)
id: zufii, df_shape: (23, 11)
id: 9c98s, df_shape: (31, 11)
id: bsijt, df_shape: (7, 11)
id: 86gjb, df_shape: (8, 11)
id: 2z8ru, df_shape: (4, 11)
id: e712f, df_shape: (17, 11)
id: jiu54, df_shape: (18, 11)
id: u8hh3, df_shape: (9, 11)
id: cbmii, df_shape: (37, 11)
id: 1ptl7, df_shape: (14, 11)
id: 7hwup, df_shape: (5, 11)
id: 3ti3a, df_shape: (1, 11)
id: 2b2si, df_shape: (4, 11)
id: c0bgr, df_shape: (2, 11)
id: ec0vy, df_shape: (18, 11)
id: zwwia, df_shape: (20, 11)
id: ta429, df_shape: (2, 11)
id: elnor, df_shape: (2, 11)
id: nqovk, df_shape: (1, 11)
id: glfco, df_shape: (2, 11)
id: i5uv7, df_shape: (12, 11)
id: 9iykh, df_shape: (4, 

id: gl2rh, df_shape: (5, 11)
id: d01i3, df_shape: (8, 11)
id: ctsa9, df_shape: (1, 11)
id: aumfc, df_shape: (3, 11)
id: zuj9f, df_shape: (7, 11)
id: bmutq, df_shape: (2, 11)
id: oq63i, df_shape: (4, 11)
id: 45osy, df_shape: (2, 11)
id: ygvnj, df_shape: (1, 11)
id: f26fn, df_shape: (2, 11)
id: a8n9n, df_shape: (3, 11)
id: tszwv, df_shape: (1, 11)
id: eq3q9, df_shape: (6, 11)
id: mdhrj, df_shape: (1, 11)
id: bpdd6, df_shape: (10, 11)
id: v4w6f, df_shape: (5, 11)
id: kpn31, df_shape: (1, 11)
id: 63znt, df_shape: (1, 11)
id: ildwi, df_shape: (7, 11)
id: yhaun, df_shape: (1, 11)
id: l2toz, df_shape: (1, 11)
id: zsvgj, df_shape: (3, 11)
id: w2az3, df_shape: (1, 11)
id: u78jm, df_shape: (1, 11)
id: zhlnb, df_shape: (5, 11)
id: e0s3b, df_shape: (4, 11)
id: kq0o0, df_shape: (2, 11)
id: nizmc, df_shape: (2, 11)
id: drbt1, df_shape: (1, 11)
id: lpdrn, df_shape: (2, 11)
id: nj8ci, df_shape: (7, 11)
id: ba07u, df_shape: (1, 11)
id: bc3eo, df_shape: (1, 11)
id: mvck2, df_shape: (4, 11)
id: wg3ye, df

id: 12rsq, df_shape: (73, 11)
id: l3bnj, df_shape: (19, 11)
id: 9jykv, df_shape: (1, 11)
id: nul8e, df_shape: (1, 11)
id: opx5m, df_shape: (2, 11)
id: ybqvc, df_shape: (3, 11)
id: 1vsk4, df_shape: (1, 11)
id: owehg, df_shape: (23, 11)
id: 1rols, df_shape: (38, 11)
id: mjnpe, df_shape: (1, 11)
id: 5tz3u, df_shape: (1, 11)
id: fx4nt, df_shape: (1, 11)
id: camme, df_shape: (3, 11)
id: 9lqrt, df_shape: (1, 11)
id: 9fwa1, df_shape: (1, 11)
id: rxvls, df_shape: (1, 11)
id: iz29h, df_shape: (6, 11)
id: lr9ih, df_shape: (10, 11)
id: mi86m, df_shape: (1, 11)
id: g5gk0, df_shape: (1, 11)
id: nsqnh, df_shape: (7, 11)
id: uikzo, df_shape: (1, 11)
id: 857j2, df_shape: (4, 11)
id: s6buw, df_shape: (10, 11)
id: hdx8h, df_shape: (1, 11)
id: 925gt, df_shape: (1, 11)
id: h4poo, df_shape: (2, 11)
id: a95bg, df_shape: (3, 11)
id: birmg, df_shape: (1, 11)
id: mm3ln, df_shape: (3, 11)
id: byg6g, df_shape: (2, 11)
id: bhuzo, df_shape: (2, 11)
id: xjrbu, df_shape: (1, 11)
id: cq4uy, df_shape: (1, 11)
id: wx71

In [220]:
# Number of entries in auction_dictinoary (it is indexed by auction id below, e.g. 'zz4dz').
len(auction_dictinoary)

13999

## Get a single auction to test with

In [221]:
# Work on a deep copy so the columns added below never leak back into auction_dictinoary.
df = auction_dictinoary['zz4dz'].copy(deep=True)

# Add the temporal difference between bids.
# pd.to_datetime reads the raw integers in `time` as nanoseconds since the epoch (its
# default unit); only the differences between these timestamps are used below.
df['date_time'] = pd.to_datetime(df['time'])

# Sort chronologically first: diff() compares each row with the row physically above it,
# so the frame must be in time order before differencing.
df = df.sort_values(['date_time'])

# Gap to the previous bid. The first bid has no predecessor (NaT), so it gets a zero gap.
# Fill with a Timedelta rather than the integer 0: integer fills on a timedelta64 Series
# are deprecated in pandas, and this keeps the dtype as timedelta64 throughout.
tdelta = df['date_time'].diff().fillna(pd.Timedelta(0))

# Express the gap as a float number of seconds.
df['time_delta_auction_bids'] = tdelta / np.timedelta64(1, 's')

# Keep the original row label as an 'index' column and renumber rows 0..n-1 in time order.
df = df.reset_index()

In [222]:
# Distribution of the gaps between consecutive bids; row 0 is left out because its gap is
# only the 0 placeholder filled in for the first bid.
df['time_delta_auction_bids'].iloc[1:].describe()

count      99.000000
mean      109.590112
std       520.058652
min         0.157895
25%         6.315789
50%        20.052632
75%        43.842105
max      4273.473684
Name: time_delta_auction_bids, dtype: float64

In [223]:
# Gaps between consecutive bids, excluding row 0 (its gap is always the 0 placeholder).
time_delta_auction_bids = df['time_delta_auction_bids'].iloc[1:]

# describe() summary of those gaps: count, mean, std, min, 25%, 50%, 75%, max.
describe_of_time_delta_auction_bids = time_delta_auction_bids.describe()

# Add the distribution of the deltas: one constant column per statistic. `count` (the first
# entry) is skipped; the bid count is stored separately in total_bids_in_auction.
# Iterating label/value pairs avoids positional integer lookups on a string-labelled Series,
# which pandas has deprecated.
for stat_name, stat_value in describe_of_time_delta_auction_bids.iloc[1:].items():
    df['{}_{}'.format('time_delta_auction_bids', stat_name)] = stat_value

df['time_delta_bids_in_auction_median'] = time_delta_auction_bids.median()
df['time_delta_bids_in_auction_kurtosis'] = time_delta_auction_bids.kurtosis()
df['total_bids_in_auction'] = df.shape[0] # total bid count

# Flag the chronologically first and last bid of the auction (rows are already time-sorted).
df['first_auction_bid'] = 0
df['last_auction_bid'] = 0
df.iloc[0, df.columns.get_loc('first_auction_bid')] = 1
df.iloc[-1, df.columns.get_loc('last_auction_bid')] = 1

In [224]:
# Preview the first 10 rows of the single-auction frame with the columns added above.
df.head(10)

Unnamed: 0,index,bid_id,bidder_id,auction,merchandise,device,time,country,ip,url,payment_account,address,date_time,time_delta_auction_bids,time_delta_auction_bids_mean,time_delta_auction_bids_std,time_delta_auction_bids_min,time_delta_auction_bids_25%,time_delta_auction_bids_50%,time_delta_auction_bids_75%,time_delta_auction_bids_max,time_delta_bids_in_auction_median,time_delta_bids_in_auction_kurtosis,total_bids_in_auction,first_auction_bid,last_auction_bid
0,275163,16058,d174177146370aacbd5ae107b6be78828tx3e,zz4dz,home goods,phone35,9759296263157894,id,177.47.141.241,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c228hf8ol,a3d2de7675556553a5f08e4c88d2c228f3rnz,1970-04-23 22:54:56.263157894,0.0,109.590112,520.058652,0.157895,6.315789,20.052632,43.842105,4273.473684,20.052632,51.790288,100,1,0
1,1358525,21730,de6958a61ea1eff953cf7920213437769l52k,zz4dz,sporting goods,phone41,9759311000000000,id,221.23.35.241,5v4j0726m1kzq4x,1803011a1b59e0a302edcd0ddc50bc39ca2xj,60f712920e06473169a6feebe65448edhx6kv,1970-04-23 22:55:11.000000000,14.736842,109.590112,520.058652,0.157895,6.315789,20.052632,43.842105,4273.473684,20.052632,51.790288,100,0,0
2,275400,43900,d174177146370aacbd5ae107b6be78828tx3e,zz4dz,home goods,phone45,9759371526315789,id,228.239.59.50,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c228hf8ol,a3d2de7675556553a5f08e4c88d2c228f3rnz,1970-04-23 22:56:11.526315789,60.526316,109.590112,520.058652,0.157895,6.315789,20.052632,43.842105,4273.473684,20.052632,51.790288,100,0,0
3,1253272,47889,ffd62646d600b759a985d45918bd6f0431vmz,zz4dz,mobile,phone4,9759382578947368,id,220.216.170.202,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c228qdyy3,a3d2de7675556553a5f08e4c88d2c22847ays,1970-04-23 22:56:22.578947368,11.052632,109.590112,520.058652,0.157895,6.315789,20.052632,43.842105,4273.473684,20.052632,51.790288,100,0,0
4,275459,50397,d174177146370aacbd5ae107b6be78828tx3e,zz4dz,home goods,phone35,9759389736842105,id,47.26.163.208,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c228hf8ol,a3d2de7675556553a5f08e4c88d2c228f3rnz,1970-04-23 22:56:29.736842105,7.157895,109.590112,520.058652,0.157895,6.315789,20.052632,43.842105,4273.473684,20.052632,51.790288,100,0,0
5,275493,54957,d174177146370aacbd5ae107b6be78828tx3e,zz4dz,home goods,phone228,9759402789473684,id,3.210.112.183,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c228hf8ol,a3d2de7675556553a5f08e4c88d2c228f3rnz,1970-04-23 22:56:42.789473684,13.052632,109.590112,520.058652,0.157895,6.315789,20.052632,43.842105,4273.473684,20.052632,51.790288,100,0,0
6,275590,68661,d174177146370aacbd5ae107b6be78828tx3e,zz4dz,home goods,phone26,9759442157894736,id,39.0.169.174,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c228hf8ol,a3d2de7675556553a5f08e4c88d2c228f3rnz,1970-04-23 22:57:22.157894736,39.368421,109.590112,520.058652,0.157895,6.315789,20.052632,43.842105,4273.473684,20.052632,51.790288,100,0,0
7,1124829,76120,4b8a1c9b43261dcf750eedee25978bbfp7yrj,zz4dz,mobile,phone222,9759462631578947,id,185.16.249.85,a36yq541h3oifcb,7081754574845aabc6871c3d42df200fnyedl,acab65e927840c8d2c16e25cd1329de4x8bmo,1970-04-23 22:57:42.631578947,20.473684,109.590112,520.058652,0.157895,6.315789,20.052632,43.842105,4273.473684,20.052632,51.790288,100,0,0
8,1124830,77070,4b8a1c9b43261dcf750eedee25978bbfp7yrj,zz4dz,mobile,phone222,9759465157894736,id,185.16.249.85,a36yq541h3oifcb,7081754574845aabc6871c3d42df200fnyedl,acab65e927840c8d2c16e25cd1329de4x8bmo,1970-04-23 22:57:45.157894736,2.526316,109.590112,520.058652,0.157895,6.315789,20.052632,43.842105,4273.473684,20.052632,51.790288,100,0,0
9,1124832,79090,4b8a1c9b43261dcf750eedee25978bbfp7yrj,zz4dz,mobile,phone28,9759470789473684,id,220.216.170.202,peqxikkfl76rdpd,7081754574845aabc6871c3d42df200fnyedl,acab65e927840c8d2c16e25cd1329de4x8bmo,1970-04-23 22:57:50.789473684,5.631579,109.590112,520.058652,0.157895,6.315789,20.052632,43.842105,4273.473684,20.052632,51.790288,100,0,0


In [225]:
def add_auction_time_features(auction_bids):
    """Return a copy of one auction's bids with inter-bid timing features added.

    Parameters
    ----------
    auction_bids : pandas.DataFrame
        The bids of a single auction. Must contain an integer ``time`` column.
        The frame is not modified.

    Returns
    -------
    pandas.DataFrame
        The bids sorted by time and renumbered 0..n-1, with the previous row
        label kept in an ``index`` column, plus these added columns:

        * ``date_time`` - ``time`` converted with ``pd.to_datetime``.
        * ``time_delta_auction_bids`` - seconds since the previous bid in the
          auction (0 for the first bid).
        * ``time_delta_auction_bids_{mean,std,min,25%,50%,75%,max}``,
          ``time_delta_bids_in_auction_median`` and
          ``time_delta_bids_in_auction_kurtosis`` - statistics of those gaps,
          excluding the first bid's placeholder 0, repeated on every row.
        * ``total_bids_in_auction`` - number of bids in the auction.
        * ``first_auction_bid`` / ``last_auction_bid`` - 1 on the earliest and
          latest bid respectively, 0 elsewhere.
    """
    # Copy first: assigning columns directly on the stored frame mutates it and raises
    # SettingWithCopyWarning when that frame is itself a slice of a larger one.
    bids = auction_bids.copy()

    # add temporal difference between bids
    bids['date_time'] = pd.to_datetime(bids['time'])

    # must be in time order before diff(), which compares each row with the one above it
    bids = bids.sort_values(['date_time'])

    # The first bid has no predecessor (NaT) and gets a zero gap. Fill with a Timedelta:
    # integer fills on a timedelta64 Series are deprecated in pandas.
    gaps = bids['date_time'].diff().fillna(pd.Timedelta(0))
    bids['time_delta_auction_bids'] = gaps / np.timedelta64(1, 's')

    bids = bids.reset_index()

    # statistics ignore row 0, whose delta is always the 0 placeholder
    real_gaps = bids['time_delta_auction_bids'].iloc[1:]
    gap_summary = real_gaps.describe()

    # add distribution of deltas data; skip describe()'s first entry (count).
    # Label/value iteration avoids deprecated positional `[]` lookups on the Series.
    for stat_name, stat_value in gap_summary.iloc[1:].items():
        bids['{}_{}'.format('time_delta_auction_bids', stat_name)] = stat_value

    bids['time_delta_bids_in_auction_median'] = real_gaps.median()
    bids['time_delta_bids_in_auction_kurtosis'] = real_gaps.kurtosis()
    bids['total_bids_in_auction'] = bids.shape[0] # total bid count

    # add column to show if this was first and last bid in auction
    bids['first_auction_bid'] = 0
    bids['last_auction_bid'] = 0
    bids.iloc[0, bids.columns.get_loc('first_auction_bid')] = 1
    bids.iloc[-1, bids.columns.get_loc('last_auction_bid')] = 1

    return bids


list_of_df = []

# One feature-augmented frame per auction; `df` is rebound on every pass, as before.
for auction_bids in auction_dictinoary.values():
    df = add_auction_time_features(auction_bids)
    list_of_df.append(df)


# Stack all auctions into one frame. Rows stay grouped auction by auction; the row
# labels are renumbered, and each row's earlier label is kept in the 'index' column.
unordered_df = pd.concat(list_of_df, ignore_index=True)

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy


In [230]:
# Reference shapes noted for the two datasets this cell has been run on:
#   (3071224, 27)  shape of training
#   (4585110, 26)  shape of testing
# Compare the value displayed below against the one for the dataset being processed.
unordered_df.shape

(4585110, 26)

In [231]:
# Preview the concatenated frame; rows are still grouped auction by auction at this point.
unordered_df.head(10)

Unnamed: 0,index,bid_id,bidder_id,auction,merchandise,device,time,country,ip,url,payment_account,address,date_time,time_delta_auction_bids,time_delta_auction_bids_mean,time_delta_auction_bids_std,time_delta_auction_bids_min,time_delta_auction_bids_25%,time_delta_auction_bids_50%,time_delta_auction_bids_75%,time_delta_auction_bids_max,time_delta_bids_in_auction_median,time_delta_bids_in_auction_kurtosis,total_bids_in_auction,first_auction_bid,last_auction_bid
0,0,0,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,ewmzr,jewelry,phone0,9759243157894736,us,69.166.231.58,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:03.157894736,0.0,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,1,0
1,362389,30,708ba5d36271639a9003ace4dc2cc540mugek,ewmzr,mobile,phone27,9759243315789473,us,196.99.84.184,a1qvn2e5zlg48fw,a3d2de7675556553a5f08e4c88d2c228pico6,3e925d082f80fd4fb458fca0f909d8b0sfgwb,1970-04-23 22:54:03.315789473,0.157895,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,0,0
2,481836,67,2419ed502cf6b4cc6feb0a47697a045b4gqiq,ewmzr,mobile,phone55,9759243473684210,us,231.63.201.73,vasstdc27m7nks3,d7f36c1e7caaa3914c36033442b56b861laao,f326c75ac92f64210b37b3f44e24ee8ar7dij,1970-04-23 22:54:03.473684210,0.157895,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,0,0
3,8,421,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,ewmzr,jewelry,phone0,9759245368421052,us,69.166.231.58,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:05.368421052,1.894737,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,0,0
4,235279,509,ffbc0fdfbf19a8a9116b68714138f2902cc13,ewmzr,mobile,phone126,9759245842105263,us,143.106.183.245,xscesvsk920626v,940251010efee6b9b24ca095b1edf6e7pfrtb,1a06878ed1aa10e72c3cbeaf37639d231nvu1,1970-04-23 22:54:05.842105263,0.473684,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,0,0
5,1042508,610,8eb7051f291a31dd19950b100722419b633td,ewmzr,mobile,phone237,9759246473684210,us,73.74.178.1,x2356876p4ypa7j,a3d2de7675556553a5f08e4c88d2c228zjtpq,a83115083bab1ec3420c5845b9de5721p0mit,1970-04-23 22:54:06.473684210,0.631579,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,0,0
6,1042509,618,8eb7051f291a31dd19950b100722419b633td,ewmzr,mobile,phone237,9759246526315789,us,73.74.178.1,x2356876p4ypa7j,a3d2de7675556553a5f08e4c88d2c228zjtpq,a83115083bab1ec3420c5845b9de5721p0mit,1970-04-23 22:54:06.526315789,0.052632,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,0,0
7,999669,646,5fcec311d29fdcdc8f1b662eb2068997xt2oc,ewmzr,sporting goods,phone23,9759246631578947,us,51.79.186.54,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c228jxbbd,a3d2de7675556553a5f08e4c88d2c228u78kn,1970-04-23 22:54:06.631578947,0.105263,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,0,0
8,871372,670,713fa3177b9c9c7c92cc9f74b71e84db0tss4,ewmzr,sporting goods,phone8,9759246789473684,us,160.9.191.22,fm6jlgjh9fjbddz,dff57801408b67a54c032984322d8443mkkd8,61877e8b75ca913326bc1e9ba96e40e8wylcu,1970-04-23 22:54:06.789473684,0.157895,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,0,0
9,12,880,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,ewmzr,jewelry,phone220,9759248052631578,us,27.17.221.171,coaikfz4ebln9vg,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:08.052631578,1.263158,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,0,0


In [232]:
# Undo the per-auction grouping: the 'index' column holds each row's label from before
# the per-auction reset_index(), so sorting on it restores that earlier row order.
df_ordered = unordered_df.sort_values('index')
df_ordered.head(10)

Unnamed: 0,index,bid_id,bidder_id,auction,merchandise,device,time,country,ip,url,payment_account,address,date_time,time_delta_auction_bids,time_delta_auction_bids_mean,time_delta_auction_bids_std,time_delta_auction_bids_min,time_delta_auction_bids_25%,time_delta_auction_bids_50%,time_delta_auction_bids_75%,time_delta_auction_bids_max,time_delta_bids_in_auction_median,time_delta_bids_in_auction_kurtosis,total_bids_in_auction,first_auction_bid,last_auction_bid
0,0,0,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,ewmzr,jewelry,phone0,9759243157894736,us,69.166.231.58,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:03.157894736,0.0,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,1,0
2068,1,14,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,wberf,jewelry,phone15,9759243263157894,au,134.243.148.253,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:03.263157894,0.0,4263.473684,4448.048902,1249.210526,1709.157895,2169.105263,5770.605263,9372.105263,2169.105263,,4,1,0
2072,2,106,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,hw5at,jewelry,phone80,9759243736842105,ke,227.231.81.211,v2gyrh0dbr31atn,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:03.736842105,0.0,48.986369,145.055987,0.052632,7.223684,19.105263,41.565789,2080.315789,19.105263,143.252999,279,1,0
2351,3,152,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,uw3sx,jewelry,phone41,9759243947368421,iq,140.231.164.76,xdsfv4oevw5owkq,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:03.947368421,0.0,9.655037,12.437212,0.0,2.052632,5.526316,12.736842,121.842105,5.526316,18.918137,1410,1,0
3761,4,155,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,q79ya,jewelry,phone102,9759244000000000,za,187.81.242.103,eex5it5avrad6s8,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:04.000000000,0.0,15.387376,35.667397,0.0,2.052632,6.473684,16.236842,477.368421,6.473684,98.942022,548,1,0
4309,5,169,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,qcppg,jewelry,phone5,9759244052631578,in,13.136.161.106,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:04.052631578,0.0,6.65199,14.990715,0.0,0.947368,2.473684,6.684211,375.578947,2.473684,200.810588,2051,1,0
6360,6,224,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,fqfbw,jewelry,phone4,9759244368421052,in,153.47.226.142,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:04.368421052,0.0,29.921745,44.757204,0.157895,5.815789,15.605263,35.842105,402.157895,15.605263,23.583485,305,1,0
6665,7,366,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,idfc3,jewelry,phone4,9759245052631578,ke,207.97.126.108,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:05.052631578,0.0,14.482801,32.58094,0.0,2.526316,6.210526,14.789474,590.526316,6.210526,136.969767,942,1,0
3,8,421,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,ewmzr,jewelry,phone0,9759245368421052,us,69.166.231.58,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:05.368421052,1.894737,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,0,0
7607,9,422,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,2yowp,jewelry,phone46,9759245368421052,iq,140.231.164.76,hsfvg8lforbluvq,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:05.368421052,0.0,4.71595,6.187722,0.0,1.052632,2.736842,6.0,70.684211,2.736842,22.017629,2893,1,0


In [234]:
# Persist the re-ordered, feature-augmented bids. The row labels are not written
# (index=False, the documented boolean form; the 'index' column is still saved).
df_ordered.to_csv('dataset/auction_data_added_testing.csv', index=False)

In [235]:
# Read the file written above back in as a round-trip check of the saved CSV.
# No parse_dates is passed, so read_csv will not convert `date_time` back to datetimes.
# NOTE(review): this rebinds `df_test`, which the second cell of the notebook loaded from
# 'test.csv'; from here on the name refers to the feature-augmented bids instead. Confirm
# that no later cell still expects the original frame.
df_test = pd.read_csv('dataset/auction_data_added_testing.csv')
df_test.head(10)

Unnamed: 0,index,bid_id,bidder_id,auction,merchandise,device,time,country,ip,url,payment_account,address,date_time,time_delta_auction_bids,time_delta_auction_bids_mean,time_delta_auction_bids_std,time_delta_auction_bids_min,time_delta_auction_bids_25%,time_delta_auction_bids_50%,time_delta_auction_bids_75%,time_delta_auction_bids_max,time_delta_bids_in_auction_median,time_delta_bids_in_auction_kurtosis,total_bids_in_auction,first_auction_bid,last_auction_bid
0,0,0,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,ewmzr,jewelry,phone0,9759243157894736,us,69.166.231.58,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:03.157894736,0.0,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,1,0
1,1,14,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,wberf,jewelry,phone15,9759243263157894,au,134.243.148.253,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:03.263157894,0.0,4263.473684,4448.048902,1249.210526,1709.157895,2169.105263,5770.605263,9372.105263,2169.105263,,4,1,0
2,2,106,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,hw5at,jewelry,phone80,9759243736842105,ke,227.231.81.211,v2gyrh0dbr31atn,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:03.736842105,0.0,48.986369,145.055987,0.052632,7.223684,19.105263,41.565789,2080.315789,19.105263,143.252999,279,1,0
3,3,152,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,uw3sx,jewelry,phone41,9759243947368421,iq,140.231.164.76,xdsfv4oevw5owkq,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:03.947368421,0.0,9.655037,12.437212,0.0,2.052632,5.526316,12.736842,121.842105,5.526316,18.918137,1410,1,0
4,4,155,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,q79ya,jewelry,phone102,9759244000000000,za,187.81.242.103,eex5it5avrad6s8,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:04.000000000,0.0,15.387376,35.667397,0.0,2.052632,6.473684,16.236842,477.368421,6.473684,98.942022,548,1,0
5,5,169,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,qcppg,jewelry,phone5,9759244052631578,in,13.136.161.106,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:04.052631578,0.0,6.65199,14.990715,0.0,0.947368,2.473684,6.684211,375.578947,2.473684,200.810588,2051,1,0
6,6,224,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,fqfbw,jewelry,phone4,9759244368421052,in,153.47.226.142,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:04.368421052,0.0,29.921745,44.757204,0.157895,5.815789,15.605263,35.842105,402.157895,15.605263,23.583485,305,1,0
7,7,366,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,idfc3,jewelry,phone4,9759245052631578,ke,207.97.126.108,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:05.052631578,0.0,14.482801,32.58094,0.0,2.526316,6.210526,14.789474,590.526316,6.210526,136.969767,942,1,0
8,8,421,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,ewmzr,jewelry,phone0,9759245368421052,us,69.166.231.58,vasstdc27m7nks3,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:05.368421052,1.894737,6.594607,10.63153,0.0,0.631579,2.473684,8.052632,111.105263,2.473684,19.24391,2068,0,0
9,9,422,8dac2b259fd1c6d1120e519fb1ac14fbqvax8,2yowp,jewelry,phone46,9759245368421052,iq,140.231.164.76,hsfvg8lforbluvq,a3d2de7675556553a5f08e4c88d2c2282ay1v,7f4c6ac489cbd95e38e4f093bb308af5jae25,1970-04-23 22:54:05.368421052,0.0,4.71595,6.187722,0.0,1.052632,2.736842,6.0,70.684211,2.736842,22.017629,2893,1,0
