In [None]:
%load_ext autoreload
%autoreload 2

import os
import sys

# Resolve the directory two levels above the current working directory and
# register it on the import path once, so repeated runs of this cell do not
# add duplicate entries.
module_path = os.path.abspath(os.path.join(os.pardir, os.pardir))
if sys.path.count(module_path) == 0:
    sys.path.append(module_path)

import pandas as pd
import numpy as np
import seaborn as sns

# 1. Initial Setup

**Download Datasets**

The following datasets will be used for modeling:

- NBA Advanced Metrics from FiveThirtyEight (csv) - Publicly available: 
https://github.com/fivethirtyeight/nba-player-advanced-metrics

- Clone the repo into the data folder in this project's main directory.

```bash
# navigate to the data folder and run
git clone https://github.com/fivethirtyeight/nba-player-advanced-metrics.git
```

- NCAA Dataset was provided with written permission from barttorvik.com (csv) - To work with the site's data without scraping it, contact the site owner via Twitter direct message and explain what you will be using the data for. If approved, he will provide instructions for obtaining the necessary data. 

    — Follow the provided instructions to create a dataset with the following filters:

    - data from 2008-2019
    - drafted = True
    
Store the csv as `ncaa_stats.csv` in the data folder in this project's main directory.



# 2. Import Data

In [None]:
# Load the FiveThirtyEight historical NBA metrics CSV, decoding it as latin-1.
raptor_df = pd.read_csv(
    "../../data/nba-player-advanced-metrics/nba-data-historical.csv",
    encoding="latin-1",
)

In [None]:
# header=None: the file is read as having no header row, so the first line is
# treated as data and the columns receive integer labels.
ncaa_df = pd.read_csv(
    "../../data/ncaa_stats.csv",
    header=None,
)

# 3. Create SQLite Database

In [None]:
import sqlite3
from sqlite3 import Error

def create_connection(db_file):
    """Open a SQLite database at ``db_file`` and immediately close it again.

    Connecting creates the database file when it does not exist yet, so this
    acts as a "make sure the database exists" step. On success the version of
    the underlying SQLite library is printed; a ``sqlite3.Error`` raised while
    connecting is printed instead of being propagated.

    Args:
        db_file: Path of the SQLite database file (``":memory:"`` also works).

    Returns:
        None. Any connection that was opened is closed before returning.
    """
    conn = None
    try:
        conn = sqlite3.connect(db_file)
        # ``sqlite3.version`` (the legacy pysqlite module version) is
        # deprecated since Python 3.12 and removed in 3.14, where it would
        # raise an uncaught AttributeError. Report the SQLite library version.
        print(sqlite3.sqlite_version)
    except Error as e:
        print(e)
    finally:
        # Always release the handle, whether or not the version print succeeded.
        if conn:
            conn.close()

# Create (or verify) the project database, but only when this code is executed
# as the main module rather than imported.
if __name__ == "__main__":
    create_connection("AI_SCOUT.db")

# 4. Save Tables to AI_SCOUT.db

In [None]:
# Open the connection that the following cells use to write the tables.
conn = sqlite3.connect("AI_SCOUT.db")

In [None]:
# Write the RAPTOR frame to table "RAPTOR": an existing table is replaced and
# the DataFrame index is not stored as a column.
raptor_df.to_sql(name="RAPTOR", con=conn, if_exists="replace", index=False)

In [None]:
# Write the NCAA frame to table "NCAA": an existing table is replaced and the
# DataFrame index is not stored as a column.
ncaa_df.to_sql(name="NCAA", con=conn, if_exists="replace", index=False)

# 5. Close Connection

In [None]:
# Release the SQLite connection opened for writing the tables.
conn.close()