## Selenium on footballDB

In [1]:
%matplotlib inline
import pandas as pd
import numpy as np
import re
import time
import selenium
from selenium import webdriver
from selenium.webdriver.common.keys import Keys
from selenium.webdriver.support.ui import Select
from selenium.webdriver.common.action_chains import ActionChains
from selenium.webdriver.support import expected_conditions as EC
from selenium.webdriver.common.by import By
from selenium.webdriver.support.ui import WebDriverWait
from bs4 import BeautifulSoup
import warnings
warnings.filterwarnings('ignore')

import urllib
import requests

In [2]:
# HTMLTableParser from:
# https://srome.github.io/Parsing-HTML-Tables-in-Python-with-BeautifulSoup-and-pandas/
class HTMLTableParser:
    """Fetch a web page and turn each of its ``<table>`` elements into a DataFrame."""

    def parse_url(self, url, timeout=None):
        """Download *url* and parse every table found in the response.

        Args:
            url: Address of the page to fetch.
            timeout: Optional number of seconds handed to ``requests.get``.
                ``None`` (the default) keeps the previous behaviour of
                waiting without a limit.

        Returns:
            A list of ``(table_id, DataFrame)`` tuples, one per ``<table>``
            in document order.  ``table_id`` is ``None`` when the table has
            no ``id`` attribute.
        """
        response = requests.get(url, timeout=timeout)
        soup = BeautifulSoup(response.text, 'lxml')
        return self._parse_soup(soup)

    def _parse_soup(self, soup):
        """Return ``(table_id, DataFrame)`` for every table in a parsed document."""
        # ``table.get('id')`` rather than ``table['id']``: indexing raises
        # KeyError for a table that carries no id attribute.
        return [(table.get('id'), self.parse_html_table(table))
                for table in soup.find_all('table')]

    def parse_html_table(self, table):
        """Convert one parsed ``<table>`` element into a DataFrame.

        Column titles come from the first row that contains ``<th>`` cells;
        without any, columns are numbered from 0.  Only rows containing
        ``<td>`` cells become data rows.  Columns whose values all convert
        to float are converted; the others keep their text.

        Args:
            table: Parsed table element exposing ``find_all`` on itself and
                its rows, and ``get_text`` on its cells.

        Returns:
            The table contents as a ``pandas.DataFrame``.

        Raises:
            Exception: If header cells were found but their count differs
                from the number of cells in the first data row.
        """
        n_columns = 0
        n_rows = 0
        column_names = []
        rows = table.find_all('tr')

        # First pass: size the frame and pick up the header row if present.
        for row in rows:
            td_tags = row.find_all('td')
            if td_tags:
                n_rows += 1
                if n_columns == 0:
                    # The first data row fixes the column count.
                    n_columns = len(td_tags)

            th_tags = row.find_all('th')
            if th_tags and not column_names:
                column_names = [th.get_text() for th in th_tags]

        # Safeguard on column titles.
        if column_names and len(column_names) != n_columns:
            raise Exception("Column titles do not match the number of columns")

        columns = column_names if column_names else range(0, n_columns)
        df = pd.DataFrame(columns=columns, index=range(0, n_rows))

        # Second pass: copy the cell text; header-only rows are skipped.
        row_marker = 0
        for row in rows:
            cells = row.find_all('td')
            for column_marker, cell in enumerate(cells):
                df.iat[row_marker, column_marker] = cell.get_text()
            if cells:
                row_marker += 1

        # Convert to float if possible; text columns are left untouched.
        for col in df:
            try:
                df[col] = df[col].astype(float)
            except ValueError:
                pass

        return df

In [3]:
def get_player_table(url, cat):
    """Fetch the first table on *url* and tidy its headers and ``Name`` column.

    Args:
        url: Page to download and parse.
        cat: Label text to remove from every ``Name`` cell
            (for example ``'Power Up'``).

    Returns:
        A copy of the cleaned DataFrame.

    Raises:
        IndexError: If the page contains no table.
        KeyError: If the table has no ``Name`` column.
    """
    parser = HTMLTableParser()
    # parse_url yields (table_id, DataFrame) tuples; only the first frame is used.
    table = parser.parse_url(url)[0][1]

    # Fix up headers: drop the newlines surrounding each title.
    table.columns = [col.strip('\n') for col in table.columns]

    # regex=False makes both replacements literal on every pandas version;
    # the default changed in pandas 2.0, and a label containing regex
    # metacharacters would otherwise be interpreted as a pattern on older ones.
    names = table['Name'].str.replace('\n', '', regex=False)
    names = names.str.replace(cat, '', regex=False)
    table['Name'] = names.str.strip()
    return table.copy()

### Power Up Players

In [4]:
# Scrape result pages 1-8 of the Power Up listing, one DataFrame per page.
df_list = []

for page_num in range(1, 9):
    url = f'https://www.muthead.com/19/players?filter-market=3&filter-program-19=229&page={page_num}'
    page_table = get_player_table(url, 'Power Up')
    df_list.append(page_table)
    # Pause between requests.
    time.sleep(2)

# Stack the per-page frames into a single table.
mut_data = pd.concat(df_list)

In [5]:
mut_data.head()

Unnamed: 0,Unnamed: 1,Name,OVR,POS,PS4
0,,Ed Reed,75.0,SS,6150
1,,Steve Smith Sr,75.0,WR,3550
2,,Ronde Barber,74.0,CB,2500
3,,Dermontti Dawson,74.0,C,3050
4,,Eddie George,74.0,HB,2750


In [8]:
mut_data.shape

(177, 5)

### Hall Of Fame Players

In [9]:
url2 = 'https://www.muthead.com/19/players?filter-program-19=238&filter-market=3&&filter-tier=8'
hof_df = get_player_table(url2, 'Hall of Fame')

In [10]:
hof_df

Unnamed: 0,Unnamed: 1,Name,OVR,POS,PS4
0,,Terrell Davis,77.0,HB,13.0K
1,,Dan Marino,77.0,QB,13.5K
2,,Terrell Owens,77.0,WR,12.2K
3,,Brian Urlacher,77.0,MLB,13.0K
4,,Rod Woodson,77.0,CB,12.2K


### Master Players

In [12]:
url3 = 'https://www.muthead.com/19/players?filter-program-19=236&filter-market=3&'
master_df = get_player_table(url3, 'Master')

In [13]:
master_df

Unnamed: 0,Unnamed: 1,Name,OVR,POS,PS4
0,,Ryan Shazier,70.0,MLB,
1,,Ricky Williams,70.0,HB,


### Team Captains

In [14]:
url4 = 'https://www.muthead.com/19/players?filter-program-19=244&filter-market=3&'
team_captains = get_player_table(url4, 'Team Captain')

In [15]:
team_captains

Unnamed: 0,Unnamed: 1,Name,OVR,POS,PS4
0,,Ray Lewis,75.0,MLB,
1,,Jerry Rice,75.0,WR,
2,,Shannon Sharpe,75.0,TE,
3,,Michael Strahan,75.0,LE,


In [16]:
mut_cats = [mut_data, hof_df, master_df, team_captains]
all_players = pd.concat(mut_cats).reset_index(drop=True)

In [17]:
all_players.shape

(188, 5)

In [21]:
mut_data.shape

(177, 5)

In [22]:
mut_data.to_csv('mut_data_oct13.csv')
all_players.to_csv('mut_pu_data_oct13.csv')

In [23]:
all_players.head(10)

Unnamed: 0,Unnamed: 1,Name,OVR,POS,PS4
0,,Ed Reed,75.0,SS,6150
1,,Steve Smith Sr,75.0,WR,3550
2,,Ronde Barber,74.0,CB,2500
3,,Dermontti Dawson,74.0,C,3050
4,,Eddie George,74.0,HB,2750
5,,Kevin Greene,74.0,LOLB,3450
6,,Donovan McNabb,74.0,QB,2850
7,,Jonathan Ogden,74.0,LT,2650
8,,Deion Sanders,74.0,CB,5950
9,,Lawrence Taylor,74.0,ROLB,3850


In [24]:
previous_df = pd.read_csv('/Users/mattjohnson/Desktop/Python2018/MUT/all_powerups.csv')
previous_df.drop('Unnamed: 0', axis=1, inplace=True)

In [25]:
previous_df

Unnamed: 0,Name,OVR,POS,PS4,firstName,lastName,POS2,Player,Pos,College,...,Oak,Phi,Pit,SF,Sea,TB,Ten,Was,RAMS,CHARGERS
0,Champ Bailey,73,CB,2000,Champ,Bailey,DB,"Bailey, Champ",DB,Georgia,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0,0
1,Randy Moss,73,WR,3400,Randy,Moss,WR,"Moss, Randy",WR,Marshall,...,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0,0
2,Michael Vick,73,QB,4100,Michael,Vick,QB,"Vick, Michael",QB,Virginia Tech,...,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0,0
3,Reggie White,73,LE,1900,Reggie,White,DE,"White, Reggie",DE,Tennessee,...,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0
4,Derrick Brooks,72,ROLB,2800,Derrick,Brooks,LB,"Brooks, Derrick",LB,Florida State,...,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0,0
5,Ted Hendricks,72,LOLB,1800,Ted,Hendricks,LB,"Hendricks, Ted",LB,Miami,...,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1,0
6,Steve Hutchinson,72,LG,2600,Steve,Hutchinson,OG,"Hutchinson, Steve",OG,Michigan,...,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0,0
7,Lorenzo Neal,72,FB,4000,Lorenzo,Neal,RB,"Neal, Lorenzo",RB,Fresno State,...,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0,1
8,Willie Roaf,72,LT,1500,Willie,Roaf,OT,"Roaf, Willie",OT,Louisiana Tech,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0
9,Bruce Smith,72,RE,2200,Bruce,Smith,DE,"Smith, Bruce",DE,Virginia Tech,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0,0


In [27]:
# Compare the names in the previously saved table with the fresh scrape.
prev_names = set(previous_df['Name'].values)
curr_names = set(all_players['Name'].values)

inter = prev_names & curr_names   # present in both
d1 = prev_names - curr_names      # only in the previous table
d2 = curr_names - prev_names      # only in the current scrape
print(len(prev_names), len(curr_names))
print(len(d1), len(d2), len(inter))

155 188
0 33 155


In [28]:
d2

{'Aeneas Williams',
 'Barry Sanders',
 'Brian Dawkins',
 'Brian Urlacher',
 'Dan Marino',
 'DeMarcus Ware',
 'Deion Sanders',
 'Derek Carr',
 'Dermontti Dawson',
 'Donovan McNabb',
 "Dont'a Hightower",
 'Ed Reed',
 'Eddie George',
 'Ha Ha Clinton-Dix',
 'Jerry Rice',
 'John Randle',
 'Jonathan Ogden',
 'Kevin Greene',
 'Larry Allen',
 'Lawrence Taylor',
 'Michael Strahan',
 'Patrick Mahomes',
 'Ray Lewis',
 'Ricky Williams',
 'Rod Woodson',
 'Ronde Barber',
 'Ryan Shazier',
 'Shannon Sharpe',
 'Steve Smith Sr',
 'Terrell Davis',
 'Terrell Owens',
 'Tim Brown',
 'Tony Gonzalez'}

In [29]:
for _ in d2:
    print(_)

Eddie George
Jerry Rice
Shannon Sharpe
Derek Carr
Ray Lewis
Barry Sanders
Ronde Barber
Tony Gonzalez
Lawrence Taylor
Dan Marino
Dermontti Dawson
John Randle
Aeneas Williams
Michael Strahan
Ha Ha Clinton-Dix
Kevin Greene
Dont'a Hightower
Ed Reed
Patrick Mahomes
Donovan McNabb
Terrell Davis
Jonathan Ogden
Brian Urlacher
Ricky Williams
Deion Sanders
Larry Allen
Steve Smith Sr
Rod Woodson
Tim Brown
Brian Dawkins
Terrell Owens
DeMarcus Ware
Ryan Shazier


In [30]:
previous_df.head()

Unnamed: 0,Name,OVR,POS,PS4,firstName,lastName,POS2,Player,Pos,College,...,Oak,Phi,Pit,SF,Sea,TB,Ten,Was,RAMS,CHARGERS
0,Champ Bailey,73,CB,2000,Champ,Bailey,DB,"Bailey, Champ",DB,Georgia,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0,0
1,Randy Moss,73,WR,3400,Randy,Moss,WR,"Moss, Randy",WR,Marshall,...,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0,0
2,Michael Vick,73,QB,4100,Michael,Vick,QB,"Vick, Michael",QB,Virginia Tech,...,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0,0
3,Reggie White,73,LE,1900,Reggie,White,DE,"White, Reggie",DE,Tennessee,...,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0
4,Derrick Brooks,72,ROLB,2800,Derrick,Brooks,LB,"Brooks, Derrick",LB,Florida State,...,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0,0


In [31]:
all_players.head()

Unnamed: 0,Unnamed: 1,Name,OVR,POS,PS4
0,,Ed Reed,75.0,SS,6150
1,,Steve Smith Sr,75.0,WR,3550
2,,Ronde Barber,74.0,CB,2500
3,,Dermontti Dawson,74.0,C,3050
4,,Eddie George,74.0,HB,2750


In [32]:
# Work on a copy of the combined scrape.  (An earlier, commented-out version
# of this cell loaded 'madden19_powerups.csv' and trimmed the Name column.)
powerups = all_players.copy()

# Split each name on whitespace: the first token is the first name and the
# remaining tokens, re-joined with spaces, form the last name.
df2 = powerups['Name'].str.split().to_frame()
powerups['firstName'] = df2['Name'].map(lambda parts: parts[0])
powerups['lastName'] = df2['Name'].map(lambda parts: ' '.join(parts[1:]))

# Result is not stored; inside a cell this only matters when it is the last line.
powerups['POS'].value_counts()

# Coarser position group -> the listing positions that fall into it.
position_groups = {
    'DB': ('CB', 'SS', 'FS'),
    'WR': ('WR',),
    'QB': ('QB',),
    'RB': ('HB', 'FB'),
    'TE': ('TE',),
    'DE': ('LE', 'RE'),
    'DT': ('DT',),
    'LB': ('LOLB', 'ROLB', 'MLB'),
    'OG': ('LG', 'RG'),
    'OT': ('LT', 'RT'),
    'C': ('C',),
}
position_dict = {
    pos: group
    for group, members in position_groups.items()
    for pos in members
}

powerups['POS2'] = powerups['POS'].map(position_dict)

In [34]:
unfins = list(powerups[ powerups['Name'].isin(d2)].index)

In [35]:
powerups.head()

Unnamed: 0,Unnamed: 1,Name,OVR,POS,PS4,firstName,lastName,POS2
0,,Ed Reed,75.0,SS,6150,Ed,Reed,DB
1,,Steve Smith Sr,75.0,WR,3550,Steve,Smith Sr,WR
2,,Ronde Barber,74.0,CB,2500,Ronde,Barber,DB
3,,Dermontti Dawson,74.0,C,3050,Dermontti,Dawson,C
4,,Eddie George,74.0,HB,2750,Eddie,George,RB


In [36]:
powerups.tail()

Unnamed: 0,Unnamed: 1,Name,OVR,POS,PS4,firstName,lastName,POS2
183,,Ricky Williams,70.0,HB,,Ricky,Williams,RB
184,,Ray Lewis,75.0,MLB,,Ray,Lewis,LB
185,,Jerry Rice,75.0,WR,,Jerry,Rice,WR
186,,Shannon Sharpe,75.0,TE,,Shannon,Sharpe,TE
187,,Michael Strahan,75.0,LE,,Michael,Strahan,DE


In [37]:
print(powerups.shape)

(188, 8)


In [38]:
def get_player_teams(first_name, last_name, playerPos, driver):
    """Search the page loaded in *driver* for a player and return the matching rows.

    The last name is typed into the page's search form, the form is submitted,
    and the first table of the resulting page is filtered to rows whose
    ``Player`` cell equals ``"<last_name>, <first_name>"``.  When several rows
    match, they are narrowed to those whose ``Pos`` equals *playerPos*.

    Args:
        first_name: Player's first name.
        last_name: Player's last name; this is the text that is searched for.
        playerPos: Position code used to disambiguate players sharing a name.
        driver: Selenium WebDriver already showing a page that contains the
            search form (the notebook opens a footballdb.com players page
            before calling this).

    Returns:
        A DataFrame with the matching rows.  It is empty when nobody matches
        or when the lookup fails, so results can always be passed to
        ``pd.concat``.
    """
    # Local import keeps the block self-contained.
    from io import StringIO

    search_box_xpath = '/html/body/div[1]/div[1]/div[1]/div[3]/div[5]/form/input[1]'
    submit_xpath = '/html/body/div[1]/div[1]/div[1]/div[3]/div[5]/form/input[2]'

    try:
        # find_element(By.XPATH, ...) replaces find_element_by_xpath, which
        # was removed in Selenium 4.3.
        search_box = driver.find_element(By.XPATH, search_box_xpath)
        search_box.clear()
        search_box.send_keys(last_name)

        # Submit the search and give the results page time to load.
        driver.find_element(By.XPATH, submit_xpath).click()
        time.sleep(2)

        soup = BeautifulSoup(driver.page_source, 'lxml')
        tables = soup.find_all('table')

        # read_html expects a file-like object; passing literal HTML is deprecated.
        df = pd.read_html(StringIO(str(tables[0])))[0]

        player = df[df['Player'] == (last_name + ', ' + first_name)]

        if len(player) > 1:
            player = player[player['Pos'] == playerPos]

        return player
    except Exception as err:
        # Best effort: report which lookup failed and why, then carry on.
        print(f"# ERROR: {first_name} {last_name}: {err!r}")
        return pd.DataFrame()

In [39]:
driver = webdriver.Firefox()

driver.get('https://www.footballdb.com/players/players.html?q=develin')

In [40]:
# Look up every player listed in `unfins` and collect the result frames.
player_list = []

for player in unfins:
    # `unfins` holds index labels taken from powerups.index, so select by
    # label rather than by position.
    current = powerups.loc[player]
    first, last, pos = current['firstName'], current['lastName'], current['POS2']

    try:
        teams = get_player_teams(first, last, pos, driver)
    except Exception as err:
        print('# ERROR #', first, last, repr(err))
    else:
        # Keep DataFrames only: pd.concat rejects any other kind of object,
        # so a non-frame failure value must not end up in the list.
        if isinstance(teams, pd.DataFrame):
            player_list.append(teams)
    # Pause between searches.
    time.sleep(1)

In [44]:
player_list_df = pd.concat(player_list)
player_list_df.to_csv('player_list_oct13.csv')

In [46]:
player_list_df.shape

(27, 4)

In [92]:
player_list_df['Player'].values

array(['Reed, Ed', 'Barber, Ronde', 'Dawson, Dermontti', 'George, Eddie',
       'Greene, Kevin', 'McNabb, Donovan', 'Ogden, Jonathan',
       'Sanders, Deion', 'Taylor, Lawrence', 'Allen, Larry',
       'Dawkins, Brian', 'Gonzalez, Tony', 'Randle, John',
       'Sanders, Barry', 'Williams, Aeneas', 'Carr, Derek',
       "Hightower, Dont'a", 'Mahomes, Patrick', 'Marino, Dan',
       'Owens, Terrell', 'Urlacher, Brian', 'Woodson, Rod',
       'Shazier, Ryan', 'Lewis, Ray', 'Rice, Jerry', 'Sharpe, Shannon',
       'Strahan, Michael'], dtype=object)

In [69]:
# Build "First Last" strings from (last, first) pairs.
# NOTE(review): `x` is not assigned in any visible cell, and `names` is not
# read by any later visible cell — presumably left over from an earlier
# session; confirm before re-running.
names = []

for _ in x:
    names.append(_[1].strip() + ' ' + _[0])

In [87]:
player_list_df['Name'] = player_list_df['Player'].str.split(',').values

In [88]:
player_list_df.head()

Unnamed: 0,Player,Pos,College,Teams,Name
14,"Reed, Ed",DB,Miami,"2002-2012 Bal, 2013 Hou, 2013 NYJ","[Reed, Ed]"
16,"Barber, Ronde",DB,Virginia,1997-2012 TB,"[Barber, Ronde]"
4,"Dawson, Dermontti",C,Kentucky,1988-2000 Pit,"[Dawson, Dermontti]"
3,"George, Eddie",RB,Ohio State,"1996 Hou, 1997-2003 Ten, 2004 Dal","[George, Eddie]"
16,"Greene, Kevin",LB,Auburn,"1985-1992 LA, 1993-1995 Pit, 1996 Car, 1997 SF...","[Greene, Kevin]"


In [103]:
previous_df

Unnamed: 0,Name,OVR,POS,PS4,firstName,lastName,POS2,Player,Pos,College,...,Oak,Phi,Pit,SF,Sea,TB,Ten,Was,RAMS,CHARGERS
0,Champ Bailey,73,CB,2000,Champ,Bailey,DB,"Bailey, Champ",DB,Georgia,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0,0
1,Randy Moss,73,WR,3400,Randy,Moss,WR,"Moss, Randy",WR,Marshall,...,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0,0
2,Michael Vick,73,QB,4100,Michael,Vick,QB,"Vick, Michael",QB,Virginia Tech,...,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0,0
3,Reggie White,73,LE,1900,Reggie,White,DE,"White, Reggie",DE,Tennessee,...,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0
4,Derrick Brooks,72,ROLB,2800,Derrick,Brooks,LB,"Brooks, Derrick",LB,Florida State,...,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0,0
5,Ted Hendricks,72,LOLB,1800,Ted,Hendricks,LB,"Hendricks, Ted",LB,Miami,...,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1,0
6,Steve Hutchinson,72,LG,2600,Steve,Hutchinson,OG,"Hutchinson, Steve",OG,Michigan,...,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0,0
7,Lorenzo Neal,72,FB,4000,Lorenzo,Neal,RB,"Neal, Lorenzo",RB,Fresno State,...,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0,1
8,Willie Roaf,72,LT,1500,Willie,Roaf,OT,"Roaf, Willie",OT,Louisiana Tech,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0
9,Bruce Smith,72,RE,2200,Bruce,Smith,DE,"Smith, Bruce",DE,Virginia Tech,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0,0


In [101]:
# Each 'Name' entry is a [last, first] pair; rebuild it as "First Last".
new_names = [
    pair[1].strip() + ' ' + pair[0]
    for pair in player_list_df['Name'].values
]

for t in new_names:
    print(t)

Ed Reed
Ronde Barber
Dermontti Dawson
Eddie George
Kevin Greene
Donovan McNabb
Jonathan Ogden
Deion Sanders
Lawrence Taylor
Larry Allen
Brian Dawkins
Tony Gonzalez
John Randle
Barry Sanders
Aeneas Williams
Derek Carr
Dont'a Hightower
Patrick Mahomes
Dan Marino
Terrell Owens
Brian Urlacher
Rod Woodson
Ryan Shazier
Ray Lewis
Jerry Rice
Shannon Sharpe
Michael Strahan


In [102]:
A = set(new_names)
B = set(d2)
A.symmetric_difference(B)

{'DeMarcus Ware',
 'Ha Ha Clinton-Dix',
 'Ricky Williams',
 'Steve Smith Sr',
 'Terrell Davis',
 'Tim Brown'}

In [47]:
# Load the previously saved lookup results.  The variable was misspelled
# `player_plist_a`; the following cells read `player_list_a`.
player_list_a = pd.read_csv('/Users/mattjohnson/Desktop/Python2018/MUT/player_list.csv')

In [49]:
player_list_a.drop('Unnamed: 0', axis=1, inplace=True)
print(player_list_a.shape)
player_list_a.head()

(122, 4)


Unnamed: 0,Player,Pos,College,Teams
0,"Hendricks, Ted",LB,Miami,"1969-1973 Bal, 1974 GB, 1975-1981 Oak, 1982-19..."
1,"Roaf, Willie",OT,Louisiana Tech,"1993-2001 NO, 2002-2005 KC"
2,"Smith, Bruce",DE,Virginia Tech,"1985-1999 Buf, 2000-2003 Was"
3,"Taylor, Sean",DB,Miami,2004-2007 Was
4,"Adams, Jamal",DB,Louisiana State,2017-2018 NYJ


In [120]:
player_list_df.shape

(15, 4)

In [122]:
all_data = pd.concat([player_list_a, player_list_df])

In [None]:
list(all_data[''])

In [123]:
all_data

Unnamed: 0,Player,Pos,College,Teams
0,"Hendricks, Ted",LB,Miami,"1969-1973 Bal, 1974 GB, 1975-1981 Oak, 1982-19..."
1,"Roaf, Willie",OT,Louisiana Tech,"1993-2001 NO, 2002-2005 KC"
2,"Smith, Bruce",DE,Virginia Tech,"1985-1999 Buf, 2000-2003 Was"
3,"Taylor, Sean",DB,Miami,2004-2007 Was
4,"Adams, Jamal",DB,Louisiana State,2017-2018 NYJ
5,"Amos, Adrian",DB,Penn State,2015-2018 Chi
6,"Atkins, Geno",DT,Georgia,2010-2018 Cin
7,"Barr, Anthony",LB,UCLA,2014-2018 Min
8,"Berry, Eric",DB,Tennessee,2010-2018 KC
9,"Bosa, Joey",DE,Ohio State,"2016 SD, 2017-2018 LAC"


In [184]:
# Rebuild the "Last, First" key and outer-join on it.
# NOTE(review): the all_data preview in this notebook shows only the
# Player/Pos/College/Teams columns (no firstName/lastName), and `player_list`
# is built as a plain Python list in the lookup cell — this cell presumably
# ran against different session state; confirm before re-running.
all_data['Player'] = all_data['lastName'] + ', '+ all_data['firstName']

merged_df = pd.merge(all_data, player_list, on='Player', how='outer')

In [190]:
fins = all_data[ all_data['empty']==0].index

driver = webdriver.Firefox()

driver.get('https://www.footballdb.com/players/players.html?q=develin')

In [108]:
# Second lookup pass: same procedure as the first, reading from all_data.
player_list2 = []

for player in unfins:
    # NOTE(review): `unfins` was derived from powerups.index, yet it is used
    # here as a position into all_data, and the visible all_data preview has
    # no firstName/lastName/POS2 columns — confirm the intended source frame.
    current = all_data.iloc[player]
    first, last, pos = current['firstName'], current['lastName'], current['POS2']

    try:
        teams = get_player_teams(first, last, pos, driver)
    except Exception as err:
        print('# ERROR #', first, last, repr(err))
    else:
        # Keep DataFrames only: pd.concat rejects any other kind of object.
        if isinstance(teams, pd.DataFrame):
            player_list2.append(teams)
    # Pause between searches.
    time.sleep(1)

NameError: name 'all_data' is not defined

In [None]:
# Stack the second-pass results on top of the earlier ones, discarding both
# original indexes.
# NOTE(review): `player_list` is created as a plain Python list in the lookup
# cell, and a list has no reset_index() — presumably it was a DataFrame in the
# session that produced this cell; confirm.
players2 = pd.concat(player_list2)
player_df = pd.concat([players2.reset_index(drop=True), player_list.reset_index(drop=True)])

In [205]:
player_df.shape

(141, 4)

In [None]:
powerups['Player'] = powerups['lastName'] + ', '+ powerups['firstName']

In [212]:
all_players = set(powerups['Player'].unique())
some_players = set(player_df['Player'].unique())

In [213]:
C = all_players.difference(some_players)

In [235]:
# Attach the looked-up team history to every power-up player; the outer join
# keeps players from either side that have no partner row.
merged = pd.merge(powerups, player_df, on='Player', how='outer')

# Players without a team history get a blank placeholder.
merged['Teams'] = merged['Teams'].fillna(' ')

# Strip everything except letters and commas (years, dashes, spaces), leaving
# a comma-separated list of team codes.  regex=True is required: since
# pandas 2.0 str.replace treats the pattern as literal text by default, which
# would silently leave the column unchanged.
merged['Teams'] = merged['Teams'].str.replace(r'[^a-zA-Z,]', '', regex=True)

In [285]:
# One column per team code, counting how often each code occurs in a player's
# Teams string.  The pattern is a raw string: '\s' in a normal string literal
# is an invalid escape sequence.
team_lists = merged.Teams.str.split(r'\s*,\s*', expand=True)
# .iloc[:, 1:] discards the first count column — presumably the empty-string
# bucket produced by players with a blank Teams value; verify.
df = team_lists.apply(pd.Series.value_counts, axis=1).iloc[:, 1:].fillna(0)

# Make sure every code combined below exists, so a scrape in which nobody
# played for one of these teams does not raise KeyError.
for code in ('LA', 'LAR', 'Stl', 'LAC', 'SD'):
    if code not in df.columns:
        df[code] = 0.0

# Fold the LA, LAR and Stl codes into a single RAMS flag.
df['LAR'] = df['LA'] + df['LAR']
df['RAMS'] = np.where(df['LAR'] + df['Stl'] >= 1, 1, 0)

# Fold the LAC and SD codes into a single CHARGERS flag.
df['CHARGERS'] = np.where(df['LAC'] + df['SD'] >= 1, 1, 0)

# Drop the codes that were folded in, plus the 'NFLEHam' column; codes that
# are absent from this scrape are ignored.
df.drop(['LA', 'NFLEHam', 'Stl', 'LAC', 'LAR', 'SD'], axis=1, inplace=True, errors='ignore')

In [286]:
all_df = pd.concat([merged, df], axis=1)
#all_df.to_csv('all_powerups.csv')

In [284]:
# Players in "Last, First" form, 15 entries.
# NOTE(review): neither `remaining` nor `rem_teams` is read by any visible
# cell; the two lists have the same length and appear to be parallel
# (rem_teams[i] holding the team codes for remaining[i]) — confirm.
remaining = ['Beckham Jr, Odell', 'Brown, Zach', 'Gurley II, Todd', 'Harris Jr, Chris',
 'Harrison Sr, Damon', 'Johnson, Lane', 'Johnson, Trumaine', 'Jones, Reshad', 'Slay Jr, Darius',
 'Smith, Jimmy', 'Smith, Telvin', 'Smith, Tyron', 'Tate III, Golden', 'Thomas III, Earl',
 'Williams, Trent']

# Team codes per entry, 15 lists.
rem_teams = [['NYG'], ['Ten', 'Buf', 'Was'], ['RAMS'], ['Den'], ['NYJ', 'NYG'], ['Phi'],
            ['RAMS', 'NYJ'], ['Mia'], ['Det'], ['Bal'], ['Jax'], ['Dal'], ['Sea', 'Det'], 
            ['Sea'], ['Was']]

In [288]:
all_df.to_csv('aug17_final_d')

Unnamed: 0,Name,OVR,POS,PS4,firstName,lastName,POS2,Player,Pos,College,...,Oak,Phi,Pit,SF,Sea,TB,Ten,Was,RAMS,CHARGERS
0,Champ Bailey,73,CB,2000,Champ,Bailey,DB,"Bailey, Champ",DB,Georgia,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0,0
1,Randy Moss,73,WR,3400,Randy,Moss,WR,"Moss, Randy",WR,Marshall,...,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0,0
2,Michael Vick,73,QB,4100,Michael,Vick,QB,"Vick, Michael",QB,Virginia Tech,...,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0,0
3,Reggie White,73,LE,1900,Reggie,White,DE,"White, Reggie",DE,Tennessee,...,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0
4,Derrick Brooks,72,ROLB,2800,Derrick,Brooks,LB,"Brooks, Derrick",LB,Florida State,...,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0,0
