## **Big Data Project**: *NCAA Basketball*

[source](https://console.cloud.google.com/marketplace/product/ncaa-bb-public/ncaa-basketball?q=search&referrer=search&project=big-data-sports)

 | Table | Description |
 | ----------- | ----------- |
 | **mbb_games_sr** | Team-level box scores from every men's basketball game from the 2013-14 season to the 2017-18 season. Each row shows both teams' stats for that one game. Data provided by Sportradar LLC, see www.sportradar.com for more details. |
 | **mbb_players_games_sr** | Player-level box scores from every men's basketball game from the 2013-14 season to the 2017-18 season. Each row shows a single player's stats in one game. Data provided by Sportradar LLC, see www.sportradar.com for more details. |

---
---

In [43]:
import dask
import dask.dataframe as dd
from dask.distributed import Client, progress
import dask.array as da
from dask.diagnostics import Profiler, ResourceProfiler, CacheProfiler
import timeit

import pandas as pd
import numpy as np

#prefs
pd.set_option('max_columns', None)

### *Setting up a new dask connection*
---

In [44]:
#close existing dask connection if it exists and open a new one
try:
    if client is not None:
        client.close()
        print("closed existing connection, ",client)       
except Exception as e:
    print(e)
    

closed existing connection,  <Client: not connected>


In [45]:
#get new connection
client = Client(n_workers=2, threads_per_worker=2, memory_limit='8GB')
display(client)

0,1
Client  Scheduler: tcp://127.0.0.1:59726  Dashboard: http://127.0.0.1:8787/status,Cluster  Workers: 2  Cores: 4  Memory: 14.90 GiB


In [53]:
# first, pip install gcsfs
# games_data = dd.read_csv('gcs://sportsdata641/Datasets/mbb_games_sr')
games_data = dd.read_csv('gcs://sportsdata641/Datasets/mbb_games_sr', dtype={'a_assists': 'float64', 'a_blocked_att': 'float64','a_blocks': 'float64',\
                                                                             'a_coach_tech_fouls': 'float64','a_defensive_rebounds': 'float64',\
                                                                             'a_ejections': 'float64','a_field_goals_att': 'float64','a_field_goals_made': 'float64',\
                                                                             'a_flagrant_fouls': 'float64','a_free_throws_att': 'float64',\
                                                                             'a_free_throws_made': 'float64','a_offensive_rebounds': 'float64',\
                                                                             'a_personal_fouls': 'float64','a_player_tech_fouls': 'float64',\
                                                                             'a_points': 'float64','a_rebounds': 'float64',\
                                                                             'a_steals': 'float64','a_team_rebounds': 'float64','a_team_tech_fouls': 'float64',\
                                                                             'a_team_turnovers': 'float64','a_three_points_att': 'float64',\
                                                                             'a_three_points_made': 'float64','a_turnovers': 'float64','a_two_points_att': 'float64',\
                                                                             'a_two_points_made': 'float64','attendance': 'float64','h_assists': 'float64',\
                                                                             'h_blocked_att': 'float64','h_blocks': 'float64','h_coach_tech_fouls': 'float64',\
                                                                             'h_defensive_rebounds': 'float64','h_ejections': 'float64',\
                                                                             'h_field_goals_att': 'float64','h_field_goals_made': 'float64',\
                                                                             'h_flagrant_fouls': 'float64','h_free_throws_att': 'float64',\
                                                                             'h_free_throws_made': 'float64','h_offensive_rebounds': 'float64',\
                                                                             'h_personal_fouls': 'float64','h_player_tech_fouls': 'float64','h_points': 'float64',\
                                                                             'h_rebounds': 'float64','h_steals': 'float64','h_team_rebounds': 'float64',\
                                                                             'h_team_tech_fouls': 'float64','h_team_turnovers': 'float64',\
                                                                             'h_three_points_att': 'float64','h_three_points_made': 'float64',\
                                                                             'h_turnovers': 'float64','h_two_points_att': 'float64','h_two_points_made': 'float64',\
                                                                             'periods': 'float64','venue_capacity': 'float64','venue_zip': 'object'})

# Aggregating Play-by-play data for first half

In [5]:
pbp_data = dd.read_csv('gcs://sportsdata641/Datasets/mbb_pbp_sr*', usecols =['period','game_id','team_id','home_id','away_id','event_type','event_description'],\
                      dtype={'team_id':object})

In [6]:
#Filtering out non-team events (e.g., official timeouts) and events from the second half
pbp_data2=pbp_data[(pbp_data["team_id"].notnull())&(pbp_data["period"]==1)]

In [7]:
pbp_data2.head()

Unnamed: 0,game_id,away_id,home_id,period,team_id,event_description,event_type
19141,063879c7-2bae-473f-aa3f-8a68f444bb73,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,532d3874-b4b3-4c5c-acc6-749a6db26c8f,1,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,Omar Richard turnover (traveling),turnover
19142,063879c7-2bae-473f-aa3f-8a68f444bb73,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,532d3874-b4b3-4c5c-acc6-749a6db26c8f,1,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,Omar Richard misses free throw 1 of 2,freethrowmiss
19143,063879c7-2bae-473f-aa3f-8a68f444bb73,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,532d3874-b4b3-4c5c-acc6-749a6db26c8f,1,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,Jay Mayernik misses two point layup,twopointmiss
19145,063879c7-2bae-473f-aa3f-8a68f444bb73,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,532d3874-b4b3-4c5c-acc6-749a6db26c8f,1,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,Jay Mayernik makes two point layup,twopointmade
19150,063879c7-2bae-473f-aa3f-8a68f444bb73,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,532d3874-b4b3-4c5c-acc6-749a6db26c8f,1,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,Javonte Byrd misses two point layup,twopointmiss


In [8]:
#pbp_data2.compute()
#1852059 rows is about 10k+ games, assuming about 170 first half plays per game

Note: event_type definitions can be found here: https://developer.sportradar.com/docs/basketball/NCAA_Mens_Basketball_v7#frequently-asked-questions

In [9]:
pbp_data2["2PA"]=(pbp_data2["event_type"].isin(["twopointmade","twopointmiss"]))
pbp_data2["2PM"]=(pbp_data2["event_type"]=="twopointmade")
pbp_data2["3PA"]=(pbp_data2["event_type"]=="threepointmade")|(pbp_data2["event_type"]=="threepointmiss")
pbp_data2["3PM"]=(pbp_data2["event_type"]=="threepointmade")
pbp_data2["FTA"]=(pbp_data2["event_type"]=="freethrowmade")|(pbp_data2["event_type"]=="freethrowmiss")
pbp_data2["FTM"]=(pbp_data2["event_type"]=="freethrowmade")
pbp_data2["TRB"]=(pbp_data2["event_type"]=="rebound")
pbp_data2["TO"]=(pbp_data2["event_type"]=="turnover")
pbp_data2["Foul"]=(pbp_data2["event_type"].isin(["flagrantone","flagranttwo","clearpathfoul","technicalfoul",\
                                                "minortechnicalfoul","personalfoul","defensivethreeseconds"]))
pbp_data2["Flagrant"]=(pbp_data2["event_type"].isin(["flagrantone","flagranttwo"]))
pbp_data2["Ejection"]=(pbp_data2["event_type"]=="ejection")


In [10]:
#pbp_data2.compute()

In [11]:
def checkast(row):
    if row["event_type"] in ["twopointmade","threepointmade"]:
        return "assist" in row["event_description"]
    else:
        return False


pbp_data2["AST"] =pbp_data2.apply(checkast,axis=1)

You did not provide metadata, so Dask is running your function on a small dataset to guess output types. It is possible that Dask will guess incorrectly.
To provide an explicit output types or to silence this message, please provide the `meta=` keyword, as described in the map or apply function that you are using.
  Before: .apply(func)
  After:  .apply(func, meta=(None, 'bool'))



In [12]:
def checkstl(row):
    if row["event_type"] == "turnover":
        return "steal" in row["event_description"]
    else:
        return False
    
pbp_data2["STLA"] =pbp_data2.apply(checkstl,axis=1)

def checkblk(row):
    if row["event_type"] in ["twopointmiss","threepointmiss"]:
        return "block" in row["event_description"]
    else:
        return False
pbp_data2["BLKA"] = pbp_data2.apply(checkblk,axis=1)


In [13]:
pbp_data2.head()

Unnamed: 0,game_id,away_id,home_id,period,team_id,event_description,event_type,2PA,2PM,3PA,3PM,FTA,FTM,TRB,TO,Foul,Flagrant,Ejection,AST,STLA,BLKA
19141,063879c7-2bae-473f-aa3f-8a68f444bb73,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,532d3874-b4b3-4c5c-acc6-749a6db26c8f,1,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,Omar Richard turnover (traveling),turnover,False,False,False,False,False,False,False,True,False,False,False,False,False,False
19142,063879c7-2bae-473f-aa3f-8a68f444bb73,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,532d3874-b4b3-4c5c-acc6-749a6db26c8f,1,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,Omar Richard misses free throw 1 of 2,freethrowmiss,False,False,False,False,True,False,False,False,False,False,False,False,False,False
19143,063879c7-2bae-473f-aa3f-8a68f444bb73,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,532d3874-b4b3-4c5c-acc6-749a6db26c8f,1,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,Jay Mayernik misses two point layup,twopointmiss,True,False,False,False,False,False,False,False,False,False,False,False,False,False
19145,063879c7-2bae-473f-aa3f-8a68f444bb73,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,532d3874-b4b3-4c5c-acc6-749a6db26c8f,1,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,Jay Mayernik makes two point layup,twopointmade,True,True,False,False,False,False,False,False,False,False,False,False,False,False
19150,063879c7-2bae-473f-aa3f-8a68f444bb73,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,532d3874-b4b3-4c5c-acc6-749a6db26c8f,1,9c7f3b90-ec9f-4a30-9ade-e0bcb8c8835e,Javonte Byrd misses two point layup,twopointmiss,True,False,False,False,False,False,False,False,False,False,False,False,False,False


In [14]:
pbp_data2[(pbp_data2["BLKA"])].head()

Unnamed: 0,game_id,away_id,home_id,period,team_id,event_description,event_type,2PA,2PM,3PA,3PM,FTA,FTM,TRB,TO,Foul,Flagrant,Ejection,AST,STLA,BLKA
19956,054771c4-3908-4486-b46a-104d50135101,c10544de-e3bd-4776-ba2e-83df8c017fd1,4383eb6a-7fd8-4ff2-94c5-43c933121e88,1,4383eb6a-7fd8-4ff2-94c5-43c933121e88,Jarrod Uthoff blocks JayVaughn Pinkston's two ...,twopointmiss,True,False,False,False,False,False,False,False,False,False,False,False,False,True
20067,5be9a30e-3582-465d-b19e-5388eddbacd5,0d8a328f-20ce-410b-bed1-15fc01308aaf,3a000455-de7c-4ca8-880e-abdce7f21da9,1,0d8a328f-20ce-410b-bed1-15fc01308aaf,D.J. Haley blocks Myles Davis's two point shot,twopointmiss,True,False,False,False,False,False,False,False,False,False,False,False,False,True
20126,63d257d7-4865-49d1-afd1-fd4ca560bbd5,c10544de-e3bd-4776-ba2e-83df8c017fd1,06d15d35-4955-4fdd-83d9-32d24dbd795b,1,06d15d35-4955-4fdd-83d9-32d24dbd795b,Aaron White blocks Cedrick Lang's two point shot,twopointmiss,True,False,False,False,False,False,False,False,False,False,False,False,False,True
20137,679a305f-2359-4e0f-97ca-3d886ca3d1c3,b827dbdf-230f-4916-9703-3bb9004e26eb,4fbebf0a-e117-4a0c-8f15-c247535a2a1b,1,4fbebf0a-e117-4a0c-8f15-c247535a2a1b,Robert Hubbs III blocks Devin Thomas's two poi...,twopointmiss,True,False,False,False,False,False,False,False,False,False,False,False,False,True
20178,7bee62f8-1a9f-4ab9-896c-9200ef45eea8,06d15d35-4955-4fdd-83d9-32d24dbd795b,fae4855b-1b64-4b40-a632-9ed345e1e952,1,fae4855b-1b64-4b40-a632-9ed345e1e952,John Bohannon blocks Tarik Black's two point shot,twopointmiss,True,False,False,False,False,False,False,False,False,False,False,False,False,True


In [15]:
pbp_data3 = pbp_data2.groupby(["game_id","team_id"]).agg({'2PA':'sum','2PM':'sum','3PA':'sum','3PM':'sum','FTA':'sum',\
                                                         'FTM':'sum','TRB':'sum','TO':'sum','Foul':'sum','Flagrant':'sum',\
                                                         'Ejection':'sum','AST':'sum','STLA':'sum','BLKA':'sum'})

In [16]:
agg_data = pbp_data3.compute()

In [17]:
#agg_data["PTS"] = 2*agg_data["2PM"]+3*agg_data["3PM"]+agg_data["FTM"]

In [18]:
display(agg_data)

Unnamed: 0_level_0,Unnamed: 1_level_0,2PA,2PM,3PA,3PM,FTA,FTM,TRB,TO,Foul,Flagrant,Ejection,AST,STLA,BLKA
game_id,team_id,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
000872e5-f02a-4b64-ac73-b6b1a7ad10ec,4f4b0771-994c-4126-822d-7525aaa00f65,17,7,6,1,14,10,21,7,8,0,0,2,5,1
000872e5-f02a-4b64-ac73-b6b1a7ad10ec,912f8837-1d81-4ef9-a576-a21f271d4c64,15,3,16,7,9,7,19,7,9,0,0,5,5,2
000918c3-b8bf-472a-9a12-94a1984700eb,1551b3a0-6d10-4ffa-8dfa-73b56f004553,25,11,4,3,9,6,19,12,6,0,0,10,7,1
000918c3-b8bf-472a-9a12-94a1984700eb,b795ddbc-baab-4499-8803-52e8608520ab,19,9,8,2,12,7,17,12,3,0,0,8,7,4
000b3698-3ce9-44bd-954b-65703a2c6ef1,4f4b0771-994c-4126-822d-7525aaa00f65,22,8,9,1,12,9,27,13,3,0,0,3,9,1
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
daec9de3-4a8a-4125-8978-a38e1fd18264,dfe0d93f-94a5-47fb-b7aa-f74786e09acb,22,5,10,3,8,7,24,12,8,0,0,3,4,3
db626521-110e-443b-83a8-00ae1aaa5a28,61a3908a-7492-4b6f-809e-12c61976bb0a,18,11,9,4,2,2,18,9,8,0,0,8,6,1
db626521-110e-443b-83a8-00ae1aaa5a28,d203f38a-a166-4258-bca2-e161b591ecfb,18,8,9,2,3,2,11,5,6,0,0,4,2,2
f1063e80-23c7-486b-9a5e-faa52beb2d83,4383eb6a-7fd8-4ff2-94c5-43c933121e88,18,10,13,4,6,5,22,7,2,0,0,3,4,1


# Merging aggregated first half data to game data:
Plan: 
1) Compute pandas dataframe g_data
2) Merge agg_data to g_data using game_id and team_id to game_id and h_id, prefix with h
3) Merge agg_data to g_data using game_id and team_id to game_id and a_id, prefix with a

In [19]:
g_data = games_data.compute()
display(g_data)



Unnamed: 0,game_id,season,status,coverage,neutral_site,scheduled_date,gametime,conference_game,tournament,tournament_type,tournament_round,tournament_game_no,attendance,lead_changes,times_tied,periods,possession_arrow,venue_id,venue_city,venue_state,venue_address,venue_zip,venue_country,venue_name,venue_capacity,h_name,h_market,h_id,h_alias,h_league_id,h_league_name,h_league_alias,h_conf_id,h_conf_name,h_conf_alias,h_division_id,h_division_name,h_division_alias,h_logo_large,h_logo_medium,h_logo_small,h_points_game,h_rank,h_minutes,h_field_goals_made,h_field_goals_att,h_field_goals_pct,h_three_points_made,h_three_points_att,h_three_points_pct,h_two_points_made,h_two_points_att,h_two_points_pct,h_blocked_att,h_free_throws_made,h_free_throws_att,h_free_throws_pct,h_offensive_rebounds,h_defensive_rebounds,h_rebounds,h_assists,h_turnovers,h_steals,h_blocks,h_assists_turnover_ratio,h_personal_fouls,h_ejections,h_foulouts,h_points,h_fast_break_pts,h_second_chance_pts,h_team_turnovers,h_points_off_turnovers,h_team_rebounds,h_flagrant_fouls,h_player_tech_fouls,h_team_tech_fouls,h_coach_tech_fouls,a_name,a_market,a_id,a_alias,a_league_id,a_league_name,a_league_alias,a_conf_id,a_conf_name,a_conf_alias,a_division_id,a_division_name,a_division_alias,a_logo_large,a_logo_medium,a_logo_small,a_points_game,a_rank,a_minutes,a_field_goals_made,a_field_goals_att,a_field_goals_pct,a_three_points_made,a_three_points_att,a_three_points_pct,a_two_points_made,a_two_points_att,a_two_points_pct,a_blocked_att,a_free_throws_made,a_free_throws_att,a_free_throws_pct,a_offensive_rebounds,a_defensive_rebounds,a_rebounds,a_assists,a_turnovers,a_steals,a_blocks,a_assists_turnover_ratio,a_personal_fouls,a_ejections,a_foulouts,a_points,a_fast_break_pts,a_second_chance_pts,a_team_turnovers,a_points_off_turnovers,a_team_rebounds,a_flagrant_fouls,a_player_tech_fouls,a_team_tech_fouls,a_coach_tech_fouls,created
0,b4451a02-26c5-4005-9ac8-b06c1f71e661,2015,closed,full,,2015-11-24,2015-11-24 21:30:00 UTC,,,,,,2400.0,3.0,2.0,2.0,68a3227f-677f-43b0-9a3a-cad79d0df9e2,c69e13a7-4637-4b0e-9ca8-043ac5738a9d,Maui,HI,1840 Honoapiilani Hwy,96761,USA,Lahaina Civic Center,2400.0,Silverswords,Chaminade University,ef13a371-76ed-409c-9aa6-35135183e170,CHA,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,ff8025b4-2752-413b-a6fe-4a5c36c47bab,Pacific West Conference,PACWEST-D2,9c6f6fe5-c9a1-4260-8d87-f9866ca271ba,NCAA Division II,D2,,,,73,0,3:20:00,26.0,61.0,42.6,10.0,19.0,52.6,16.0,42.0,0.381,7.0,11.0,16.0,68.8,6.0,26.0,32.0,17.0,22.0,6.0,2.0,0.77,25.0,0.0,,73.0,14.0,3.0,0.0,19.0,2.0,0.0,0.0,0.0,0.0,Rebels,UNLV,68a3227f-677f-43b0-9a3a-cad79d0df9e2,UNLV,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,93a776e4-d390-48e1-95bb-74945457366a,Mountain West,MWC,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,93,0,3:20:00,37.0,76.0,48.7,4.0,16.0,25.0,33.0,60.0,0.550,2.0,15.0,30.0,50.0,16.0,29.0,45.0,15.0,10.0,16.0,7.0,1.50,17.0,0.0,,93.0,36.0,17.0,0.0,31.0,5.0,0.0,0.0,0.0,0.0,2018-02-20 15:48:58 UTC
1,b2f579ca-9eff-4b2b-a747-81169399c2e8,2015,closed,full,,2015-11-24,2015-11-24 02:00:00 UTC,,,,,,2400.0,1.0,0.0,2.0,fae4855b-1b64-4b40-a632-9ed345e1e952,c69e13a7-4637-4b0e-9ca8-043ac5738a9d,Maui,HI,1840 Honoapiilani Hwy,96761,USA,Lahaina Civic Center,2400.0,Silverswords,Chaminade University,ef13a371-76ed-409c-9aa6-35135183e170,CHA,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,ff8025b4-2752-413b-a6fe-4a5c36c47bab,Pacific West Conference,PACWEST-D2,9c6f6fe5-c9a1-4260-8d87-f9866ca271ba,NCAA Division II,D2,,,,72,0,3:20:00,24.0,69.0,34.8,8.0,33.0,24.2,16.0,36.0,0.444,7.0,16.0,21.0,76.2,9.0,13.0,22.0,10.0,14.0,7.0,1.0,0.71,21.0,0.0,,72.0,6.0,13.0,0.0,9.0,4.0,0.0,0.0,0.0,0.0,Jayhawks,Kansas,fae4855b-1b64-4b40-a632-9ed345e1e952,KU,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,2853cf4d-6d62-4ec6-8e2c-d69f7a01a557,Big 12,BIG12,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,123,5,3:20:00,47.0,73.0,64.4,15.0,29.0,51.7,32.0,44.0,0.727,1.0,14.0,20.0,70.0,13.0,37.0,50.0,32.0,14.0,9.0,7.0,2.29,17.0,0.0,,123.0,16.0,25.0,0.0,25.0,1.0,0.0,0.0,0.0,0.0,2018-02-20 15:48:53 UTC
2,571be71c-a5bf-446e-bf21-30eb6c54ac5e,2015,closed,full,,2015-11-25,2015-11-25 19:30:00 UTC,,,,,,2400.0,2.0,0.0,2.0,ef13a371-76ed-409c-9aa6-35135183e170,c69e13a7-4637-4b0e-9ca8-043ac5738a9d,Maui,HI,1840 Honoapiilani Hwy,96761,USA,Lahaina Civic Center,2400.0,Silverswords,Chaminade University,ef13a371-76ed-409c-9aa6-35135183e170,CHA,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,ff8025b4-2752-413b-a6fe-4a5c36c47bab,Pacific West Conference,PACWEST-D2,9c6f6fe5-c9a1-4260-8d87-f9866ca271ba,NCAA Division II,D2,,,,93,0,3:20:00,34.0,67.0,50.7,13.0,29.0,44.8,21.0,38.0,0.553,5.0,12.0,20.0,60.0,7.0,17.0,24.0,19.0,12.0,8.0,0.0,1.58,17.0,0.0,,93.0,6.0,11.0,0.0,32.0,4.0,0.0,0.0,0.0,0.0,Red Storm,St. John's,c1f4aae1-aa16-4095-aeab-10e5c2a1236a,SJU,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,BIGEAST,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,100,0,3:20:00,35.0,59.0,59.3,10.0,19.0,52.6,25.0,40.0,0.625,0.0,20.0,27.0,74.1,8.0,25.0,33.0,21.0,17.0,7.0,5.0,1.24,19.0,0.0,,100.0,6.0,6.0,0.0,12.0,0.0,0.0,0.0,0.0,0.0,2018-02-20 15:48:58 UTC
3,d6617923-0b23-49e4-af9b-9e4d0243e45c,2015,closed,full,,2015-12-19,2015-12-19 04:00:00 UTC,,,,,,8032.0,9.0,1.0,2.0,532d3874-b4b3-4c5c-acc6-749a6db26c8f,1d1f74a2-7b35-56f0-8cbd-552c51cb2c14,Portland,OR,1 Center Court,97227,USA,Moda Center,19441.0,Beavers,Oregon State,532d3874-b4b3-4c5c-acc6-749a6db26c8f,ORST,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,PAC12,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,82,0,3:20:00,26.0,54.0,48.1,8.0,20.0,40.0,18.0,34.0,0.529,0.0,22.0,29.0,75.9,10.0,25.0,35.0,14.0,11.0,2.0,2.0,1.27,20.0,0.0,,82.0,4.0,10.0,0.0,16.0,3.0,0.0,0.0,0.0,0.0,Titans,Cal State Fullerton,c009914b-3303-4dee-b915-978aa48a31d0,CSF,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,5f56da49-5d81-43c3-8652-8b8da40c907f,Big West,BIGWEST,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,69,0,3:20:00,22.0,52.0,42.3,9.0,23.0,39.1,13.0,29.0,0.448,2.0,16.0,29.0,55.2,8.0,21.0,29.0,10.0,10.0,3.0,0.0,1.00,23.0,0.0,,69.0,2.0,13.0,1.0,15.0,3.0,0.0,0.0,0.0,0.0,2018-02-20 15:48:53 UTC
4,ffb463a4-dd3c-4ed9-b503-311b95ef0295,2015,closed,full,,2015-12-20,2015-12-20 04:00:00 UTC,,,,,,8555.0,1.0,3.0,2.0,2959bd24-7007-41ae-a3a3-abdf26888cfc,1d1f74a2-7b35-56f0-8cbd-552c51cb2c14,Portland,OR,1 Center Court,97227,USA,Moda Center,19441.0,Beavers,Oregon State,532d3874-b4b3-4c5c-acc6-749a6db26c8f,ORST,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,PAC12,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,76,0,3:20:00,22.0,54.0,40.7,7.0,18.0,38.9,15.0,36.0,0.417,3.0,25.0,31.0,80.6,11.0,25.0,36.0,12.0,12.0,6.0,3.0,1.00,21.0,0.0,,76.0,4.0,7.0,0.0,9.0,2.0,0.0,0.0,0.0,0.0,Golden Hurricane,Tulsa,2959bd24-7007-41ae-a3a3-abdf26888cfc,TLSA,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,3b6a48d8-1f9c-484f-8ed0-ef0a540a0efe,American Athletic,AAC,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,71,0,3:20:00,24.0,53.0,45.3,5.0,17.0,29.4,19.0,36.0,0.528,3.0,18.0,28.0,64.3,10.0,22.0,32.0,14.0,13.0,6.0,3.0,1.08,23.0,0.0,,71.0,6.0,7.0,0.0,,0.0,0.0,0.0,0.0,0.0,2018-02-20 15:48:53 UTC
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
29800,19be97d9-1756-41ac-a00f-e08c3ea5998a,2016,closed,extended_boxscore,1.0,2016-12-23,2016-12-23 20:00:00 UTC,False,,,,,0.0,0.0,0.0,2.0,,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W. Tropicana Ave,89103,USA,Orleans Arena,7471.0,Big Red,Cornell,88ff8c00-958e-4ccf-a21d-77fab9e93692,COR,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,c2d16439-b791-4f9b-84d9-80cf457a0676,Ivy,IVY,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,78,0,3:20:00,29.0,56.0,51.8,10.0,27.0,37.0,19.0,29.0,65.517,0.0,10.0,13.0,76.9,3.0,33.0,36.0,19.0,15.0,3.0,3.0,1.27,18.0,0.0,0.0,78.0,8.0,0.0,0.0,13.0,5.0,0.0,0.0,,,Redhawks,Southeast Missouri State,6a7083ab-1832-48c0-9168-427b35adbcde,SEMO,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,0f3991a1-8c5f-4a8e-8fab-d0ebbb21c35c,Ohio Valley,OVC,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,62,0,3:20:00,18.0,58.0,31.0,9.0,27.0,33.3,9.0,31.0,29.032,0.0,17.0,21.0,81.0,5.0,21.0,26.0,7.0,8.0,6.0,0.0,0.88,14.0,0.0,0.0,62.0,0.0,4.0,0.0,17.0,3.0,0.0,0.0,,,2018-02-20 16:40:02 UTC
29801,ff822d88-b370-429a-bc3c-dcd7e45b6560,2016,closed,extended_boxscore,1.0,2016-12-22,2016-12-22 22:30:00 UTC,False,,,,,4148.0,1.0,3.0,2.0,,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W. Tropicana Ave,89103,USA,Orleans Arena,7471.0,Big Red,Cornell,88ff8c00-958e-4ccf-a21d-77fab9e93692,COR,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,c2d16439-b791-4f9b-84d9-80cf457a0676,Ivy,IVY,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,84,0,3:20:00,29.0,64.0,45.3,16.0,38.0,42.1,13.0,26.0,50.000,0.0,10.0,18.0,55.6,7.0,23.0,30.0,18.0,13.0,2.0,3.0,1.38,26.0,0.0,0.0,84.0,0.0,10.0,1.0,4.0,6.0,0.0,0.0,,,Trojans,Troy,6373b18c-62f6-49bc-bd4c-8959a2466516,TROY,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,302c99fe-6b0a-40ec-8ee7-f15a0355b7b5,Sun Belt,SUNBELT,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,92,0,3:20:00,30.0,63.0,47.6,6.0,21.0,28.6,24.0,42.0,57.143,0.0,26.0,33.0,78.8,10.0,27.0,37.0,14.0,8.0,9.0,5.0,1.75,17.0,0.0,0.0,92.0,4.0,16.0,0.0,20.0,3.0,0.0,0.0,,,2018-02-20 16:40:00 UTC
29802,c1f96ff1-b0c2-49eb-9192-803bab3fe1ae,2016,closed,extended_boxscore,1.0,2016-12-23,2016-12-23 01:30:00 UTC,False,,,,,,4.0,5.0,2.0,,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W. Tropicana Ave,89103,USA,Orleans Arena,7471.0,Blue Demons,DePaul,ee09e6ad-3872-4745-bbb9-ebbd5c6f8318,DEP,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,BIGEAST,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,58,0,3:20:00,20.0,71.0,28.2,4.0,15.0,26.7,16.0,56.0,28.571,0.0,14.0,20.0,70.0,11.0,21.0,32.0,5.0,14.0,11.0,2.0,0.36,21.0,0.0,0.0,58.0,2.0,9.0,0.0,19.0,7.0,0.0,0.0,,,Cowboys,Wyoming,a7127c0a-a466-47ae-91ad-9a71ee2c9427,WYO,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,93a776e4-d390-48e1-95bb-74945457366a,Mountain West,MWC,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,72,0,3:20:00,24.0,57.0,42.1,6.0,25.0,24.0,18.0,32.0,56.250,0.0,18.0,22.0,81.8,8.0,36.0,44.0,12.0,22.0,4.0,6.0,0.55,18.0,0.0,0.0,72.0,15.0,6.0,0.0,12.0,5.0,0.0,0.0,,,2018-02-20 16:39:59 UTC
29803,3850e646-a7b2-49f1-9446-407249f9e64a,2017,closed,extended_boxscore,1.0,2017-12-23,2017-12-23 01:30:00 UTC,False,,,,,,9.0,3.0,2.0,,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W Tropicana Ave,89103,USA,Orleans Arena,9500.0,Dukes,Duquesne,fea46ac5-6dad-43cd-a770-75554dbcc118,DUQ,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,db136c00-f45b-4af6-bc7d-ffff216f2e5d,Atlantic 10,A10,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,67,0,3:20:00,23.0,52.0,44.2,8.0,16.0,50.0,15.0,36.0,41.700,0.0,13.0,18.0,72.2,6.0,21.0,27.0,9.0,14.0,7.0,5.0,0.64,19.0,0.0,0.0,67.0,10.0,6.0,2.0,17.0,4.0,0.0,0.0,,,Dons,San Francisco,d24efd99-8717-43b9-a086-9986a684ac04,SF,cd4268ee-07aa-4c4d-a435-ec44ad2c76cb,NCAA MEN,NCAAM,c664ceee-1dc0-4743-a6d8-11fbdfb87f61,West Coast,WCC,c5a8d640-5093-4044-851d-2c562e929994,NCAA Division I,D1,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,https://www.ncaa.com/sites/default/files/image...,65,0,3:20:00,25.0,54.0,46.3,5.0,13.0,38.5,20.0,41.0,48.800,0.0,10.0,13.0,76.9,5.0,21.0,26.0,14.0,14.0,2.0,4.0,1.00,19.0,0.0,0.0,65.0,3.0,3.0,0.0,17.0,4.0,0.0,0.0,,,2018-02-20 13:03:21 UTC


In [20]:
# Margin of Victory column
games_data['MOV'] = games_data['h_points_game']-games_data['a_points_game']
print("--------")
display(games_data['MOV'])
print("--------")
display(games_data.compute()['MOV'])

--------


Dask Series Structure:
npartitions=1
    int64
      ...
Name: MOV, dtype: int64
Dask Name: getitem, 6 tasks

--------


0       -20
1       -51
2        -7
3        13
4         5
         ..
29800    16
29801    -8
29802   -14
29803     2
29804    14
Name: MOV, Length: 29805, dtype: int64

In [21]:
feature_subset = ['game_id','h_id','a_id','season','conference_game','tournament','tournament_type',\
                 'tournament_round','tournament_game_no','attendance','venue_id','venue_city','venue_state',\
                 'venue_address','venue_zip','venue_capacity','MOV',\
                 'h_market','h_conf_id','h_conf_name','h_division_alias','h_points_game',\
                 'a_market','a_conf_id','a_conf_name','a_division_alias','a_points_game']

In [22]:
g_data = games_data[feature_subset].compute()

In [23]:
g_data2 = g_data.merge(agg_data.add_prefix('h_'),how='inner',left_on=['game_id','h_id'],right_on=['game_id','team_id'])
display(g_data2)

Unnamed: 0,game_id,h_id,a_id,season,conference_game,tournament,tournament_type,tournament_round,tournament_game_no,attendance,venue_id,venue_city,venue_state,venue_address,venue_zip,venue_capacity,MOV,h_market,h_conf_id,h_conf_name,h_division_alias,h_points_game,a_market,a_conf_id,a_conf_name,a_division_alias,a_points_game,h_2PA,h_2PM,h_3PA,h_3PM,h_FTA,h_FTM,h_TRB,h_TO,h_Foul,h_Flagrant,h_Ejection,h_AST,h_STLA,h_BLKA
0,b4451a02-26c5-4005-9ac8-b06c1f71e661,ef13a371-76ed-409c-9aa6-35135183e170,68a3227f-677f-43b0-9a3a-cad79d0df9e2,2015,,,,,,2400.0,c69e13a7-4637-4b0e-9ca8-043ac5738a9d,Maui,HI,1840 Honoapiilani Hwy,96761,2400.0,-20,Chaminade University,ff8025b4-2752-413b-a6fe-4a5c36c47bab,Pacific West Conference,D2,73,UNLV,93a776e4-d390-48e1-95bb-74945457366a,Mountain West,D1,93,26,11,7,4,6,3,26,16,9,0,0,8,12,5
1,b2f579ca-9eff-4b2b-a747-81169399c2e8,ef13a371-76ed-409c-9aa6-35135183e170,fae4855b-1b64-4b40-a632-9ed345e1e952,2015,,,,,,2400.0,c69e13a7-4637-4b0e-9ca8-043ac5738a9d,Maui,HI,1840 Honoapiilani Hwy,96761,2400.0,-51,Chaminade University,ff8025b4-2752-413b-a6fe-4a5c36c47bab,Pacific West Conference,D2,72,Kansas,2853cf4d-6d62-4ec6-8e2c-d69f7a01a557,Big 12,D1,123,14,5,18,4,13,11,20,10,8,0,0,3,7,4
2,571be71c-a5bf-446e-bf21-30eb6c54ac5e,ef13a371-76ed-409c-9aa6-35135183e170,c1f4aae1-aa16-4095-aeab-10e5c2a1236a,2015,,,,,,2400.0,c69e13a7-4637-4b0e-9ca8-043ac5738a9d,Maui,HI,1840 Honoapiilani Hwy,96761,2400.0,-7,Chaminade University,ff8025b4-2752-413b-a6fe-4a5c36c47bab,Pacific West Conference,D2,93,St. John's,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,D1,100,14,9,15,7,7,3,11,11,0,0,0,9,7,2
3,d6617923-0b23-49e4-af9b-9e4d0243e45c,532d3874-b4b3-4c5c-acc6-749a6db26c8f,c009914b-3303-4dee-b915-978aa48a31d0,2015,,,,,,8032.0,1d1f74a2-7b35-56f0-8cbd-552c51cb2c14,Portland,OR,1 Center Court,97227,19441.0,13,Oregon State,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,82,Cal State Fullerton,5f56da49-5d81-43c3-8652-8b8da40c907f,Big West,D1,69,19,10,14,6,9,6,24,5,3,0,0,8,1,0
4,ffb463a4-dd3c-4ed9-b503-311b95ef0295,532d3874-b4b3-4c5c-acc6-749a6db26c8f,2959bd24-7007-41ae-a3a3-abdf26888cfc,2015,,,,,,8555.0,1d1f74a2-7b35-56f0-8cbd-552c51cb2c14,Portland,OR,1 Center Court,97227,19441.0,5,Oregon State,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,76,Tulsa,3b6a48d8-1f9c-484f-8ed0-ef0a540a0efe,American Athletic,D1,71,19,6,6,2,12,10,20,12,3,0,0,5,7,2
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
11158,9dfe8c82-8d85-42f7-b88d-5a3e2849c74c,bdb7d7a4-45f8-4bf3-ab85-15488c451494,9b166a3f-e64b-4825-bb6b-92c6f0418263,2016,False,,,,,,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W. Tropicana Ave,89103,7471.0,4,Butler,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,D1,69,Arizona,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,65,16,6,10,5,11,9,13,7,8,0,0,6,3,1
11159,79e583e6-fffe-460e-821b-2157affad34f,d52c3640-069c-4554-982e-e6537c8044f1,0d8a328f-20ce-410b-bed1-15fc01308aaf,2017,False,,,,,,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W Tropicana Ave,89103,9500.0,-19,George Washington,db136c00-f45b-4af6-bc7d-ffff216f2e5d,Atlantic 10,D1,64,Xavier,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,D1,83,15,5,13,7,9,5,16,10,3,0,0,5,6,0
11160,346a418b-995d-4a81-9d02-e567d6265878,fea46ac5-6dad-43cd-a770-75554dbcc118,7cdfcf92-7fe7-46f1-9b66-6912114182e6,2017,False,,,,,0.0,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W Tropicana Ave,89103,9500.0,-10,Duquesne,db136c00-f45b-4af6-bc7d-ffff216f2e5d,Atlantic 10,D1,64,Southern Illinois,1d9219c1-696c-42a2-b1be-e8b438795521,Missouri Valley,D1,74,19,9,7,1,11,9,22,10,2,0,0,2,4,3
11161,7258d3e6-1b7e-4139-b4fb-7f469dbc4c39,820c8f26-cf11-4997-b2e2-19f47bd2f72f,92456e1e-f48c-4385-96ab-14cb27d18726,2016,False,Conference,Western Athletic,Quarterfinal 3,,1854.0,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W. Tropicana Ave,89103,7471.0,4,UMKC,7265822b-247a-4991-ae8c-0e6f33f6122b,Western Athletic,D1,82,Texas Rio Grande Valley,7265822b-247a-4991-ae8c-0e6f33f6122b,Western Athletic,D1,78,25,8,10,3,20,13,27,9,13,0,0,4,6,0


In [24]:
g_data2.columns

Index(['game_id', 'h_id', 'a_id', 'season', 'conference_game', 'tournament',
       'tournament_type', 'tournament_round', 'tournament_game_no',
       'attendance', 'venue_id', 'venue_city', 'venue_state', 'venue_address',
       'venue_zip', 'venue_capacity', 'MOV', 'h_market', 'h_conf_id',
       'h_conf_name', 'h_division_alias', 'h_points_game', 'a_market',
       'a_conf_id', 'a_conf_name', 'a_division_alias', 'a_points_game',
       'h_2PA', 'h_2PM', 'h_3PA', 'h_3PM', 'h_FTA', 'h_FTM', 'h_TRB', 'h_TO',
       'h_Foul', 'h_Flagrant', 'h_Ejection', 'h_AST', 'h_STLA', 'h_BLKA'],
      dtype='object')

In [25]:
g_data3 = g_data2.merge(agg_data.add_prefix('a_'),how='inner',left_on=['game_id','a_id'],right_on=['game_id','team_id'])

In [26]:
display(g_data3)

Unnamed: 0,game_id,h_id,a_id,season,conference_game,tournament,tournament_type,tournament_round,tournament_game_no,attendance,venue_id,venue_city,venue_state,venue_address,venue_zip,venue_capacity,MOV,h_market,h_conf_id,h_conf_name,h_division_alias,h_points_game,a_market,a_conf_id,a_conf_name,a_division_alias,a_points_game,h_2PA,h_2PM,h_3PA,h_3PM,h_FTA,h_FTM,h_TRB,h_TO,h_Foul,h_Flagrant,h_Ejection,h_AST,h_STLA,h_BLKA,a_2PA,a_2PM,a_3PA,a_3PM,a_FTA,a_FTM,a_TRB,a_TO,a_Foul,a_Flagrant,a_Ejection,a_AST,a_STLA,a_BLKA
0,b4451a02-26c5-4005-9ac8-b06c1f71e661,ef13a371-76ed-409c-9aa6-35135183e170,68a3227f-677f-43b0-9a3a-cad79d0df9e2,2015,,,,,,2400.0,c69e13a7-4637-4b0e-9ca8-043ac5738a9d,Maui,HI,1840 Honoapiilani Hwy,96761,2400.0,-20,Chaminade University,ff8025b4-2752-413b-a6fe-4a5c36c47bab,Pacific West Conference,D2,73,UNLV,93a776e4-d390-48e1-95bb-74945457366a,Mountain West,D1,93,26,11,7,4,6,3,26,16,9,0,0,8,12,5,19,9,11,2,17,9,17,15,5,0,0,6,12,2
1,b2f579ca-9eff-4b2b-a747-81169399c2e8,ef13a371-76ed-409c-9aa6-35135183e170,fae4855b-1b64-4b40-a632-9ed345e1e952,2015,,,,,,2400.0,c69e13a7-4637-4b0e-9ca8-043ac5738a9d,Maui,HI,1840 Honoapiilani Hwy,96761,2400.0,-51,Chaminade University,ff8025b4-2752-413b-a6fe-4a5c36c47bab,Pacific West Conference,D2,72,Kansas,2853cf4d-6d62-4ec6-8e2c-d69f7a01a557,Big 12,D1,123,14,5,18,4,13,11,20,10,8,0,0,3,7,4,21,13,16,7,8,6,24,11,9,0,0,14,7,0
2,571be71c-a5bf-446e-bf21-30eb6c54ac5e,ef13a371-76ed-409c-9aa6-35135183e170,c1f4aae1-aa16-4095-aeab-10e5c2a1236a,2015,,,,,,2400.0,c69e13a7-4637-4b0e-9ca8-043ac5738a9d,Maui,HI,1840 Honoapiilani Hwy,96761,2400.0,-7,Chaminade University,ff8025b4-2752-413b-a6fe-4a5c36c47bab,Pacific West Conference,D2,93,St. John's,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,D1,100,14,9,15,7,7,3,11,11,0,0,0,9,7,2,19,13,12,9,6,6,13,10,3,0,0,10,7,0
3,d6617923-0b23-49e4-af9b-9e4d0243e45c,532d3874-b4b3-4c5c-acc6-749a6db26c8f,c009914b-3303-4dee-b915-978aa48a31d0,2015,,,,,,8032.0,1d1f74a2-7b35-56f0-8cbd-552c51cb2c14,Portland,OR,1 Center Court,97227,19441.0,13,Oregon State,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,82,Cal State Fullerton,5f56da49-5d81-43c3-8652-8b8da40c907f,Big West,D1,69,19,10,14,6,9,6,24,5,3,0,0,8,1,0,12,4,16,6,13,6,18,4,5,0,0,5,1,1
4,ffb463a4-dd3c-4ed9-b503-311b95ef0295,532d3874-b4b3-4c5c-acc6-749a6db26c8f,2959bd24-7007-41ae-a3a3-abdf26888cfc,2015,,,,,,8555.0,1d1f74a2-7b35-56f0-8cbd-552c51cb2c14,Portland,OR,1 Center Court,97227,19441.0,5,Oregon State,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,76,Tulsa,3b6a48d8-1f9c-484f-8ed0-ef0a540a0efe,American Athletic,D1,71,19,6,6,2,12,10,20,12,3,0,0,5,7,2,22,9,7,2,15,10,19,12,6,0,0,6,7,2
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
11158,9dfe8c82-8d85-42f7-b88d-5a3e2849c74c,bdb7d7a4-45f8-4bf3-ab85-15488c451494,9b166a3f-e64b-4825-bb6b-92c6f0418263,2016,False,,,,,,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W. Tropicana Ave,89103,7471.0,4,Butler,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,D1,69,Arizona,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,65,16,6,10,5,11,9,13,7,8,0,0,6,3,1,19,9,8,3,11,7,20,10,6,0,0,7,3,2
11159,79e583e6-fffe-460e-821b-2157affad34f,d52c3640-069c-4554-982e-e6537c8044f1,0d8a328f-20ce-410b-bed1-15fc01308aaf,2017,False,,,,,,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W Tropicana Ave,89103,9500.0,-19,George Washington,db136c00-f45b-4af6-bc7d-ffff216f2e5d,Atlantic 10,D1,64,Xavier,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,D1,83,15,5,13,7,9,5,16,10,3,0,0,5,6,0,26,14,7,4,5,3,19,10,3,0,0,8,6,4
11160,346a418b-995d-4a81-9d02-e567d6265878,fea46ac5-6dad-43cd-a770-75554dbcc118,7cdfcf92-7fe7-46f1-9b66-6912114182e6,2017,False,,,,,0.0,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W Tropicana Ave,89103,9500.0,-10,Duquesne,db136c00-f45b-4af6-bc7d-ffff216f2e5d,Atlantic 10,D1,64,Southern Illinois,1d9219c1-696c-42a2-b1be-e8b438795521,Missouri Valley,D1,74,19,9,7,1,11,9,22,10,2,0,0,2,4,3,18,8,7,3,11,8,10,5,2,0,0,5,4,2
11161,7258d3e6-1b7e-4139-b4fb-7f469dbc4c39,820c8f26-cf11-4997-b2e2-19f47bd2f72f,92456e1e-f48c-4385-96ab-14cb27d18726,2016,False,Conference,Western Athletic,Quarterfinal 3,,1854.0,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W. Tropicana Ave,89103,7471.0,4,UMKC,7265822b-247a-4991-ae8c-0e6f33f6122b,Western Athletic,D1,82,Texas Rio Grande Valley,7265822b-247a-4991-ae8c-0e6f33f6122b,Western Athletic,D1,78,25,8,10,3,20,13,27,9,13,0,0,4,6,0,15,5,12,5,22,13,23,11,12,0,0,5,6,1


In [27]:
type(g_data3)

pandas.core.frame.DataFrame

In [28]:
g_data4 = g_data3.set_index(['game_id'],verify_integrity=True)
display(g_data4)

Unnamed: 0_level_0,h_id,a_id,season,conference_game,tournament,tournament_type,tournament_round,tournament_game_no,attendance,venue_id,venue_city,venue_state,venue_address,venue_zip,venue_capacity,MOV,h_market,h_conf_id,h_conf_name,h_division_alias,h_points_game,a_market,a_conf_id,a_conf_name,a_division_alias,a_points_game,h_2PA,h_2PM,h_3PA,h_3PM,h_FTA,h_FTM,h_TRB,h_TO,h_Foul,h_Flagrant,h_Ejection,h_AST,h_STLA,h_BLKA,a_2PA,a_2PM,a_3PA,a_3PM,a_FTA,a_FTM,a_TRB,a_TO,a_Foul,a_Flagrant,a_Ejection,a_AST,a_STLA,a_BLKA
game_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1
b4451a02-26c5-4005-9ac8-b06c1f71e661,ef13a371-76ed-409c-9aa6-35135183e170,68a3227f-677f-43b0-9a3a-cad79d0df9e2,2015,,,,,,2400.0,c69e13a7-4637-4b0e-9ca8-043ac5738a9d,Maui,HI,1840 Honoapiilani Hwy,96761,2400.0,-20,Chaminade University,ff8025b4-2752-413b-a6fe-4a5c36c47bab,Pacific West Conference,D2,73,UNLV,93a776e4-d390-48e1-95bb-74945457366a,Mountain West,D1,93,26,11,7,4,6,3,26,16,9,0,0,8,12,5,19,9,11,2,17,9,17,15,5,0,0,6,12,2
b2f579ca-9eff-4b2b-a747-81169399c2e8,ef13a371-76ed-409c-9aa6-35135183e170,fae4855b-1b64-4b40-a632-9ed345e1e952,2015,,,,,,2400.0,c69e13a7-4637-4b0e-9ca8-043ac5738a9d,Maui,HI,1840 Honoapiilani Hwy,96761,2400.0,-51,Chaminade University,ff8025b4-2752-413b-a6fe-4a5c36c47bab,Pacific West Conference,D2,72,Kansas,2853cf4d-6d62-4ec6-8e2c-d69f7a01a557,Big 12,D1,123,14,5,18,4,13,11,20,10,8,0,0,3,7,4,21,13,16,7,8,6,24,11,9,0,0,14,7,0
571be71c-a5bf-446e-bf21-30eb6c54ac5e,ef13a371-76ed-409c-9aa6-35135183e170,c1f4aae1-aa16-4095-aeab-10e5c2a1236a,2015,,,,,,2400.0,c69e13a7-4637-4b0e-9ca8-043ac5738a9d,Maui,HI,1840 Honoapiilani Hwy,96761,2400.0,-7,Chaminade University,ff8025b4-2752-413b-a6fe-4a5c36c47bab,Pacific West Conference,D2,93,St. John's,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,D1,100,14,9,15,7,7,3,11,11,0,0,0,9,7,2,19,13,12,9,6,6,13,10,3,0,0,10,7,0
d6617923-0b23-49e4-af9b-9e4d0243e45c,532d3874-b4b3-4c5c-acc6-749a6db26c8f,c009914b-3303-4dee-b915-978aa48a31d0,2015,,,,,,8032.0,1d1f74a2-7b35-56f0-8cbd-552c51cb2c14,Portland,OR,1 Center Court,97227,19441.0,13,Oregon State,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,82,Cal State Fullerton,5f56da49-5d81-43c3-8652-8b8da40c907f,Big West,D1,69,19,10,14,6,9,6,24,5,3,0,0,8,1,0,12,4,16,6,13,6,18,4,5,0,0,5,1,1
ffb463a4-dd3c-4ed9-b503-311b95ef0295,532d3874-b4b3-4c5c-acc6-749a6db26c8f,2959bd24-7007-41ae-a3a3-abdf26888cfc,2015,,,,,,8555.0,1d1f74a2-7b35-56f0-8cbd-552c51cb2c14,Portland,OR,1 Center Court,97227,19441.0,5,Oregon State,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,76,Tulsa,3b6a48d8-1f9c-484f-8ed0-ef0a540a0efe,American Athletic,D1,71,19,6,6,2,12,10,20,12,3,0,0,5,7,2,22,9,7,2,15,10,19,12,6,0,0,6,7,2
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9dfe8c82-8d85-42f7-b88d-5a3e2849c74c,bdb7d7a4-45f8-4bf3-ab85-15488c451494,9b166a3f-e64b-4825-bb6b-92c6f0418263,2016,False,,,,,,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W. Tropicana Ave,89103,7471.0,4,Butler,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,D1,69,Arizona,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,65,16,6,10,5,11,9,13,7,8,0,0,6,3,1,19,9,8,3,11,7,20,10,6,0,0,7,3,2
79e583e6-fffe-460e-821b-2157affad34f,d52c3640-069c-4554-982e-e6537c8044f1,0d8a328f-20ce-410b-bed1-15fc01308aaf,2017,False,,,,,,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W Tropicana Ave,89103,9500.0,-19,George Washington,db136c00-f45b-4af6-bc7d-ffff216f2e5d,Atlantic 10,D1,64,Xavier,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,D1,83,15,5,13,7,9,5,16,10,3,0,0,5,6,0,26,14,7,4,5,3,19,10,3,0,0,8,6,4
346a418b-995d-4a81-9d02-e567d6265878,fea46ac5-6dad-43cd-a770-75554dbcc118,7cdfcf92-7fe7-46f1-9b66-6912114182e6,2017,False,,,,,0.0,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W Tropicana Ave,89103,9500.0,-10,Duquesne,db136c00-f45b-4af6-bc7d-ffff216f2e5d,Atlantic 10,D1,64,Southern Illinois,1d9219c1-696c-42a2-b1be-e8b438795521,Missouri Valley,D1,74,19,9,7,1,11,9,22,10,2,0,0,2,4,3,18,8,7,3,11,8,10,5,2,0,0,5,4,2
7258d3e6-1b7e-4139-b4fb-7f469dbc4c39,820c8f26-cf11-4997-b2e2-19f47bd2f72f,92456e1e-f48c-4385-96ab-14cb27d18726,2016,False,Conference,Western Athletic,Quarterfinal 3,,1854.0,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W. Tropicana Ave,89103,7471.0,4,UMKC,7265822b-247a-4991-ae8c-0e6f33f6122b,Western Athletic,D1,82,Texas Rio Grande Valley,7265822b-247a-4991-ae8c-0e6f33f6122b,Western Athletic,D1,78,25,8,10,3,20,13,27,9,13,0,0,4,6,0,15,5,12,5,22,13,23,11,12,0,0,5,6,1


In [29]:
df = g_data4.loc[(g_data4['h_division_alias']=='D1')&(g_data4['a_division_alias']=='D1')]

In [30]:
display(df)

Unnamed: 0_level_0,h_id,a_id,season,conference_game,tournament,tournament_type,tournament_round,tournament_game_no,attendance,venue_id,venue_city,venue_state,venue_address,venue_zip,venue_capacity,MOV,h_market,h_conf_id,h_conf_name,h_division_alias,h_points_game,a_market,a_conf_id,a_conf_name,a_division_alias,a_points_game,h_2PA,h_2PM,h_3PA,h_3PM,h_FTA,h_FTM,h_TRB,h_TO,h_Foul,h_Flagrant,h_Ejection,h_AST,h_STLA,h_BLKA,a_2PA,a_2PM,a_3PA,a_3PM,a_FTA,a_FTM,a_TRB,a_TO,a_Foul,a_Flagrant,a_Ejection,a_AST,a_STLA,a_BLKA
game_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1
d6617923-0b23-49e4-af9b-9e4d0243e45c,532d3874-b4b3-4c5c-acc6-749a6db26c8f,c009914b-3303-4dee-b915-978aa48a31d0,2015,,,,,,8032.0,1d1f74a2-7b35-56f0-8cbd-552c51cb2c14,Portland,OR,1 Center Court,97227,19441.0,13,Oregon State,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,82,Cal State Fullerton,5f56da49-5d81-43c3-8652-8b8da40c907f,Big West,D1,69,19,10,14,6,9,6,24,5,3,0,0,8,1,0,12,4,16,6,13,6,18,4,5,0,0,5,1,1
ffb463a4-dd3c-4ed9-b503-311b95ef0295,532d3874-b4b3-4c5c-acc6-749a6db26c8f,2959bd24-7007-41ae-a3a3-abdf26888cfc,2015,,,,,,8555.0,1d1f74a2-7b35-56f0-8cbd-552c51cb2c14,Portland,OR,1 Center Court,97227,19441.0,5,Oregon State,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,76,Tulsa,3b6a48d8-1f9c-484f-8ed0-ef0a540a0efe,American Athletic,D1,71,19,6,6,2,12,10,20,12,3,0,0,5,7,2,22,9,7,2,15,10,19,12,6,0,0,6,7,2
1063177e-e168-4055-bdbf-a7fd1e33f398,9fccbf28-2858-4263-821c-fdefb3c7efa3,efba5350-79bc-47aa-a189-db177b95b491,2015,,NCAA,South Regional,First Round,Game 2,16628.0,786bfe1c-6fa3-4177-a207-0242f7f68bfb,Des Moines,IA,730 3rd Street,50309,16110.0,-7,Colorado,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,67,Connecticut,3b6a48d8-1f9c-484f-8ed0-ef0a540a0efe,American Athletic,D1,74,20,11,6,2,13,8,20,7,4,0,0,5,5,3,19,7,11,3,4,4,15,8,8,0,0,4,5,2
60b9ce90-41cb-4158-8038-1f9f80b374a5,532d3874-b4b3-4c5c-acc6-749a6db26c8f,c1c1e6df-a383-4fbd-ba7b-32d4f9ef9518,2015,,NCAA,West Regional,First Round,Game 7,15662.0,a13af216-4409-5021-8dd5-255cc71bffc3,Oklahoma City,OK,100 W. Reno Ave.,73102,18203.0,-8,Oregon State,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,67,Virginia Commonwealth,db136c00-f45b-4af6-bc7d-ffff216f2e5d,Atlantic 10,D1,75,23,8,7,3,5,3,15,4,5,0,0,6,3,3,18,13,9,1,8,7,18,6,8,0,0,8,3,1
267af1b7-9c86-4561-bf63-7a379cdaae6d,9b166a3f-e64b-4825-bb6b-92c6f0418263,f38b58de-3273-4723-a78b-2f918e9aa2d5,2015,,NCAA,South Regional,First Round,Game 5,11559.0,94e2afc1-0309-408f-84fb-2f80cbda0357,Providence,RI,101 Sabin Street,2903,12400.0,-10,Arizona,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,55,Wichita State,3b6a48d8-1f9c-484f-8ed0-ef0a540a0efe,American Athletic,D1,65,13,3,9,3,7,4,19,12,6,0,0,2,7,0,20,12,14,2,2,1,19,8,5,0,0,2,7,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9dfe8c82-8d85-42f7-b88d-5a3e2849c74c,bdb7d7a4-45f8-4bf3-ab85-15488c451494,9b166a3f-e64b-4825-bb6b-92c6f0418263,2016,False,,,,,,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W. Tropicana Ave,89103,7471.0,4,Butler,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,D1,69,Arizona,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,65,16,6,10,5,11,9,13,7,8,0,0,6,3,1,19,9,8,3,11,7,20,10,6,0,0,7,3,2
79e583e6-fffe-460e-821b-2157affad34f,d52c3640-069c-4554-982e-e6537c8044f1,0d8a328f-20ce-410b-bed1-15fc01308aaf,2017,False,,,,,,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W Tropicana Ave,89103,9500.0,-19,George Washington,db136c00-f45b-4af6-bc7d-ffff216f2e5d,Atlantic 10,D1,64,Xavier,d07bc93e-c84c-44a9-a99d-c213bd0014d6,Big East,D1,83,15,5,13,7,9,5,16,10,3,0,0,5,6,0,26,14,7,4,5,3,19,10,3,0,0,8,6,4
346a418b-995d-4a81-9d02-e567d6265878,fea46ac5-6dad-43cd-a770-75554dbcc118,7cdfcf92-7fe7-46f1-9b66-6912114182e6,2017,False,,,,,0.0,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W Tropicana Ave,89103,9500.0,-10,Duquesne,db136c00-f45b-4af6-bc7d-ffff216f2e5d,Atlantic 10,D1,64,Southern Illinois,1d9219c1-696c-42a2-b1be-e8b438795521,Missouri Valley,D1,74,19,9,7,1,11,9,22,10,2,0,0,2,4,3,18,8,7,3,11,8,10,5,2,0,0,5,4,2
7258d3e6-1b7e-4139-b4fb-7f469dbc4c39,820c8f26-cf11-4997-b2e2-19f47bd2f72f,92456e1e-f48c-4385-96ab-14cb27d18726,2016,False,Conference,Western Athletic,Quarterfinal 3,,1854.0,7b49816c-cac2-40d5-97bc-7c8c0935039d,Las Vegas,NV,4500 W. Tropicana Ave,89103,7471.0,4,UMKC,7265822b-247a-4991-ae8c-0e6f33f6122b,Western Athletic,D1,82,Texas Rio Grande Valley,7265822b-247a-4991-ae8c-0e6f33f6122b,Western Athletic,D1,78,25,8,10,3,20,13,27,9,13,0,0,4,6,0,15,5,12,5,22,13,23,11,12,0,0,5,6,1


In [31]:
df.shape

(11058, 54)

In [32]:
df["season"].unique()







array([2015, 2013, 2014, 2017, 2016], dtype=int64)

In [33]:
#Checking how many games are tournament
df['tournament'].unique()

array([nan, 'NCAA', 'Conference'], dtype=object)

In [34]:
df['tournament_type'].unique()

array([nan, 'South Regional', 'West Regional', 'Midwest Regional',
       'East Regional', 'SCAR Bracket', 'Pac', 'CBI', 'Ohio Valley',
       'CIT', 'Missouri Valley', 'Horizon League', 'Valparaiso Bracket',
       'Final Four', 'Big 12', 'Sun Belt', 'Big South', 'Big Sky',
       'American Athletic', 'Southern', 'Summit League', 'Big West',
       'Vegas 16', 'Conference USA', 'Southland', 'First Four', 'MEAC',
       'ACC', 'National Championship', 'SBON Bracket', 'Atlantic Sun',
       'Monmouth Bracket', 'Patriot League', 'Mountain West',
       'Southeastern', 'Mid', 'Big Ten', 'America East', 'Northeast',
       'Colonial Athletic', 'MAAC', 'Colorado St. Bracket',
       'Old Dominion Bracket', 'Temple Bracket', 'Richmond Bracket',
       'SWAC', 'Atlantic Coast', 'SEC', 'California Bracket',
       'Illinois St Bracket', 'Iowa Bracket', 'Syracuse Bracket',
       'Southwest Athletic', 'Ivy League', 'Atlantic 10',
       'Metro Atlantic', 'NIT', 'Big East', 'Western Athletic',
 

In [57]:
client.close()

In [36]:
df.to_csv()

'game_id,h_id,a_id,season,conference_game,tournament,tournament_type,tournament_round,tournament_game_no,attendance,venue_id,venue_city,venue_state,venue_address,venue_zip,venue_capacity,MOV,h_market,h_conf_id,h_conf_name,h_division_alias,h_points_game,a_market,a_conf_id,a_conf_name,a_division_alias,a_points_game,h_2PA,h_2PM,h_3PA,h_3PM,h_FTA,h_FTM,h_TRB,h_TO,h_Foul,h_Flagrant,h_Ejection,h_AST,h_STLA,h_BLKA,a_2PA,a_2PM,a_3PA,a_3PM,a_FTA,a_FTM,a_TRB,a_TO,a_Foul,a_Flagrant,a_Ejection,a_AST,a_STLA,a_BLKA\r\nd6617923-0b23-49e4-af9b-9e4d0243e45c,532d3874-b4b3-4c5c-acc6-749a6db26c8f,c009914b-3303-4dee-b915-978aa48a31d0,2015,,,,,,8032.0,1d1f74a2-7b35-56f0-8cbd-552c51cb2c14,Portland,OR,1 Center Court,97227,19441.0,13,Oregon State,04d5255d-b2dc-43df-9fa8-d296b0f8ccd7,Pacific 12,D1,82,Cal State Fullerton,5f56da49-5d81-43c3-8652-8b8da40c907f,Big West,D1,69,19,10,14,6,9,6,24,5,3,0,0,8,1,0,12,4,16,6,13,6,18,4,5,0,0,5,1,1\r\nffb463a4-dd3c-4ed9-b503-311b95ef0295,532d3874-b4b3-4c5c-acc6-749a6db26c8f,2