In [72]:
import os
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
from scipy import stats as sp
import csv

In [29]:
raw_data_path = 'data/'

prior = pd.read_csv(raw_data_path + 'results.csv')
fifa_dataset = pd.read_csv(raw_data_path + 'CompleteDataset.csv')

qualified_countries = ['Egypt', 'Morocco', 'Nigeria', 'Senegal', 'Tunisia', 'Australia', 'Iran', 'Japan', 'Korea Republic', 'Saudi Arabia', 'Belgium', 'Croatia', 'Denmark', 'England', 'France', 'Germany', 'Iceland', 'Poland', 'Portugal', 'Russia', 'Serbia', 'Spain', 'Sweden', 'Switzerland', 'Costa Rica', 'Mexico', 'Panama', 'Argentina', 'Brazil', 'Colombia', 'Peru', 'Uruguay']

In [30]:
fifa_dataset.drop(labels = ['Unnamed: 0', 'Age', 'Photo', 'Flag', 'Club', 'Club Logo', 'Wage'], axis = 1, inplace = True)

prior.drop(labels = ['city', 'country', 'tournament'], axis = 1, inplace = True)
prior = prior[prior.date > '1990-01-01']

In [31]:
# get qualified countries only
fifa_dataset = fifa_dataset[fifa_dataset['Nationality'].isin(qualified_countries)].fillna(0)

prior = prior[(prior['home_team'].isin(qualified_countries) & prior['away_team'].isin(qualified_countries))]

# get remaining potential
fifa_dataset['Remaining Potential'] = fifa_dataset['Potential'] - fifa_dataset['Overall']

# get only one preferred position (first only)
fifa_dataset['Preferred Position'] = fifa_dataset['Preferred Positions'].str.split().str[0]

In [32]:
squad_352_strict = ['GK', 'LB|LWB', 'CB', 'RB|RWB', 'LM|W$', 'RM|W$', 'CM', 'CM|CAM|CDM', 'CM|CAM|CDM', 'W$|T$', 'W$|T$']
squad_442_strict = ['GK', 'LB|LWB', 'CB', 'CB', 'RB|RWB', 'LM|W$', 'RM|W$', 'CM', 'CM|CAM|CDM', 'W$|T$', 'W$|T$']
squad_433_strict = ['GK', 'LB|LWB', 'CB', 'CB', 'RB|RWB', 'CM|LM|W$', 'CM|RM|W$', 'CM|CAM|CDM', 'W$|T$', 'W$|T$', 'W$|T$']
squad_343_strict = ['GK', 'LB|LWB', 'CB', 'RB|RWB', 'LM|W$', 'RM|W$', 'CM|CAM|CDM', 'CM|CAM|CDM', 'W$|T$', 'W$|T$', 'W$|T$']
squad_532_strict = ['GK', 'LB|LWB', 'CB|LWB|RWB', 'CB|LWB|RWB', 'CB|LWB|RWB', 'RB|RWB', 'M$|W$', 'M$|W$', 'M$|W$', 'W$|T$', 'W$|T$']

squad_352_adj = ['GK', 'B$', 'B$', 'B$', 'M$|W$|T$', 'M$|W$|T$', 'M$|W$|T$', 'M$|W$|T$', 'M$|W$|T$', 'W$|T$|M$', 'W$|T$|M$']
squad_442_adj = ['GK', 'B$', 'B$', 'B$', 'B$', 'M$|W$|T$', 'M$|W$|T$', 'M$|W$|T$', 'M$|W$|T$', 'W$|T$|M$', 'W$|T$|M$']
squad_433_adj = ['GK', 'B$', 'B$', 'B$', 'B$', 'M$|W$|T$', 'M$|W$|T$', 'M$|W$|T$', 'W$|T$|M$', 'W$|T$|M$', 'W$|T$|M$']
squad_343_adj = ['GK', 'B$', 'B$', 'B$', 'M$|W$|T$', 'M$|W$|T$', 'M$|W$|T$', 'M$|W$|T$', 'W$|T$|M$', 'W$|T$|M$', 'W$|T$|M$']
squad_532_adj = ['GK', 'B$', 'B$', 'B$', 'B$', 'B$', 'M$|W$|T$', 'M$|W$|T$', 'M$|W$|T$', 'W$|T$|M$', 'W$|T$|M$']

midfield = ['CDM', 'CM', 'RM', 'LM']
defense = ['GK', 'LB', 'CB', 'RB', 'LWB', 'RWB']
attack = ['LW', 'RW', 'ST', 'CAM']

squad_list_strict = [squad_352_strict, squad_442_strict, squad_433_strict, squad_343_strict, squad_532_strict]
squad_list_adj = [squad_352_adj, squad_442_adj, squad_433_adj, squad_343_adj, squad_532_adj]
squad_name = ['3-5-2', '4-4-2', '4-3-3', '3-4-3', '5-3-2']

In [33]:
def get_best_squad_n(position, nationality, df, measurement = 'Potential'):
    df_copy = df.copy()
    df_copy = df_copy[df_copy['Nationality'] == nationality]
    store = []
    team = []
    for i in position:
        store.append([df_copy.loc[[df_copy[df_copy['Preferred Position'].str.contains(i)][measurement].idxmax()]]['Preferred Position'].to_string(index = False), df_copy[df_copy['Preferred Position'].str.contains(i)][measurement].max()])
        team.append(df_copy.loc[[df_copy[df_copy['Preferred Position'].str.contains(i)][measurement].idxmax()]]['Name'].to_string(index = False))
        df_copy.drop(df_copy[df_copy['Preferred Position'].str.contains(i)][measurement].idxmax(), inplace = True)
    return np.mean([x[1] for x in store]).round(2), np.array(team), pd.DataFrame(np.array(store).reshape(11,2), columns = ['Position', measurement]).to_string(index = False)

def get_best_formation_all(squad_list, country):
    best_rating = 0
    best_squad, best_formation = [], []
    for i, formation in enumerate(squad_list):
        #curRating, cur_squad = get_best_squad_n(formation, country, fifa_dataset, 'Overall')
        potRating, pot_squad, squad_info = get_best_squad_n(formation, country, fifa_dataset, 'Potential')
        if potRating > best_rating:
            best_rating = potRating
            best_squad = pot_squad
            best_formation = squad_name[i]
    return best_rating, best_squad, best_formation, squad_info
    
def get_team_stats(squad_stats):
    midRating, defRating, attRating  = [], [], []
    for player in squad_stats.split('\n'):
        pos, rating = player.split()[0], player.split()[-1]
        if pos in midfield: midRating.append(float(rating))
        if pos in defense: defRating.append(float(rating))
        if pos in attack: attRating.append(float(rating))
    return np.mean(midRating).round(2), np.mean(defRating).round(2), np.mean(attRating).round(2)

In [34]:
# create data-set with team information
def make_team_dataframe():
    d = []
    for country in qualified_countries:
            best_rating, best_squad, best_formation, squad_stats = get_best_formation_all(squad_list_adj, country)
            mid_rating, def_rating, att_rating = get_team_stats(squad_stats)
            if best_rating > 84.0: tier = 1
            elif best_rating > 77.0: tier = 2
            else: tier = 3
            d.append({'Country': country, 'Rating': best_rating, 'Squad': best_squad, 'Defence': def_rating, 'Midfield': mid_rating, 'Attack': att_rating, 'Formation': best_formation,'Tier': tier})

    processed_data = pd.DataFrame(d).reindex_axis(['Country', 'Squad', 'Formation', 'Tier', 'Rating', 'Attack', 'Midfield', 'Defence'], axis = 1).set_index('Country')
    processed_data.to_csv('data/WC18_processed.csv', index_label = False)

In [22]:
d = []
for country in qualified_countries:
        best_rating, best_squad, best_formation, squad_stats = get_best_formation_all(squad_list_adj, country)
        mid_rating, def_rating, att_rating = get_team_stats(squad_stats)
        if best_rating > 84.0: tier = 1
        elif best_rating > 77.0: tier = 2
        else: tier = 3
        d.append({'Country': country, 'Rating': best_rating, 'Squad': best_squad, 'Defence': def_rating, 'Midfield': mid_rating, 'Attack': att_rating, 'Formation': best_formation,'Tier': tier})

processed_data = pd.DataFrame(d).reindex_axis(['Country', 'Squad', 'Formation', 'Tier', 'Rating', 'Attack', 'Midfield', 'Defence'], axis = 1).set_index('Country')
#print processed_data

                                                            Squad Formation  \
Country                                                                       
Egypt           [A. El-Shenawy, A. Hegazy, K. Hafez, O. Gaber,...     3-5-2   
Morocco         [Y. Bounou, M. Benatia, A. Hakimi, Z. Feddal, ...     3-5-2   
Nigeria         [V. Enyeama, C. Awaziem, K. Omeruo, U. Agbo, O...     3-5-2   
Senegal         [A. Gomis, K. Koulibaly, K. Mbodj, K. Mbodj, K...     3-5-2   
Tunisia         [F. Ben Mustapha, A. Abdennour, Y. Benalouane,...     3-5-2   
Australia       [M. Ryan, A. Gersbach, T. Sainsbury, B. Wright...     3-5-2   
Iran            [A. Haghighi, M. Mohammadi, K. Ansarifard, K. ...     3-5-2   
Japan           [K. Nakamura, G. Shoji, N. Ueda, M. Hasebe, Y....     3-5-2   
Korea Republic  [Yoon Bo Sang, Kim Min Jae, An Hyeon Beom, Kim...     3-5-2   
Saudi Arabia    [M. Al Owais, M. Hawsawi, O. Hawsawi, Y. Al Sh...     4-4-2   
Belgium         [T. Courtois, T. Alderweireld, L. De

In [77]:
#pdata = make_team_dataframe()
#print pdata#.head(10)
# for each team: goals scored, goals allowed, wins, loses, win difference, per year
# for each year: total num goals, goal differential,
#team.append(df_copy.loc[[df_copy[df_copy['Preferred Position'].str.contains(i)][measurement].idxmax()]]['Name'].to_string(index = False))

#print prior.head(5)
pGF = prior[(prior['home_team'] == 'Germany') & (prior['away_team'] == 'France')]['home_score'].to_string(index = False).split('\n')
#sp.mode(np.array(map(int, pGF)))
m, count = sp.mode(map(int, pGF))
print m
#pGF = np.mean(prior[(prior['home_team'] == 'Germany') & (prior['away_team'] == 'France')]['away_score'].to_string(index = False))
#pFG = prior[(prior['home_team'] == 'France') & (prior['away_team'] == 'Germany')]

#[fifa_dataset[fifa_dataset['Preferred Position'].str.contains('RM')]['Potential'].idxmax()]
#fifa_dataset[fifa_dataset['Preferred Position'].str.contains('GK')]
#,'-', prior[(prior['home_team'] == 'Germany') & (prior['away_team'] == 'France')]
#print prior[(prior.home_team == 'Germany') & (prior.away_team == 'France')]#.home_score
#print prior[(prior['home_team'] == 'Germany') & (prior['away_team'] == 'France')]
#for g in prior[(prior['home_team'] == 'Germany') & (prior['away_team'] == 'France')].iterrows():
#    print g#.home_score, '-', g.away_score
#prior[(prior['home_team'] == 'Germany') & (prior['away_team'] == 'France')].home_score

[0]


In [27]:
for countryA in qualified_countries:
    for countryB in qualified_countries:
        if countryA == countryB: continue
        print #countryA, ' vs ', countryB
        print prior[(prior['home_team'] == countryA) & (prior['away_team'] == countryB)]#.home_score.get_value(), '-', prior[(prior['home_team'] == countryA) & (prior['away_team'] == countryB)].away_score
    


# --------
def single_game(A, B):
    xAB = prior[prior.home_team == A].home_score



             date home_team away_team  home_score  away_score
23310  2001-01-28     Egypt   Morocco           0           0
27746  2006-01-24     Egypt   Morocco           0           0
37951  2017-01-29     Egypt   Morocco           1           0

             date home_team away_team  home_score  away_score
31436  2010-01-12     Egypt   Nigeria           3           1
33470  2012-04-12     Egypt   Nigeria           3           2
37185  2016-03-29     Egypt   Nigeria           1           0

             date home_team away_team  home_score  away_score
22268  2000-01-28     Egypt   Senegal           1           0
23675  2001-05-06     Egypt   Senegal           1           0
24282  2002-01-20     Egypt   Senegal           0           1
25647  2003-10-10     Egypt   Senegal           1           0
27718  2005-12-29     Egypt   Senegal           4           2
27778  2006-02-07     Egypt   Senegal           2           1
35957  2014-11-15     Egypt   Senegal           0           1

    

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

             date home_team       away_team  home_score  away_score
31709  2010-06-22   Nigeria  Korea Republic           2           2

             date home_team     away_team  home_score  away_score
31598  2010-05-25   Nigeria  Saudi Arabia           0           0

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

             date home_team away_team  home_score  away_score
24570  2002-06-12   Nigeria   England           0           0

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_


             date       home_team away_team  home_score  away_score
24515  2002-05-21  Korea Republic   England           1           1

             date       home_team away_team  home_score  away_score
24528  2002-05-26  Korea Republic    France           2           3

             date       home_team away_team  home_score  away_score
26929  2004-12-19  Korea Republic   Germany           3           1

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

             date       home_team away_team  home_score  away_score
24543  2002-06-04  Korea Republic    Poland           2           0
33013  2011-10-07  Korea Republic    Poland           2           2

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

             date       home_team away_team  home_score  away_score
22699  2000-05-28  Korea Republic    Serbia     

36893  2015-11-13    France   Germany           2           0

             date home_team away_team  home_score  away_score
33523  2012-05-27    France   Iceland           3           2
37496  2016-07-03    France   Iceland           5           2

             date home_team away_team  home_score  away_score
22384  2000-02-23    France    Poland           1           0
26800  2004-11-17    France    Poland           0           0

             date home_team away_team  home_score  away_score
22842  2000-06-28    France  Portugal           2           1
23624  2001-04-25    France  Portugal           4           0
35812  2014-10-11    France  Portugal           2           1

             date home_team away_team  home_score  away_score
24446  2002-04-17    France    Russia           0           0
37189  2016-03-29    France    Russia           4           2

             date home_team away_team  home_score  away_score
24871  2002-11-20    France    Serbia           3           0
302

Index: []

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

             date home_team  away_team  home_score  away_score
31040  2009-08-12    Russia  Argentina           2           3
38626  2017-11-11    Russia  Argentina           0           1

             date home_team away_team  home_score  away_score
27853  2006-03-01    Russia    Brazil           0           1
34536  2013-03-25    Russia    Brazil           1           1

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

             date home_team away_team  home_score  away_score
33500  2012-05-25    Russia   Uruguay           1           1

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

Empty DataFrame
Columns: [date, home_team, away_team, home_score, away_score]
Index: []

Empty DataFrame
Columns: [date, home_team,

In [286]:
processed_data

Unnamed: 0_level_0,Squad,Formation,Tier,Rating,Attack,Midfield,Defence
Country,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1
Egypt,"[A. El-Shenawy, A. Hegazy, K. Hafez, O. Gaber,...",3-5-2,2,79.0,82.33,83.0,74.17
Morocco,"[Y. Bounou, M. Benatia, A. Hakimi, Z. Feddal, ...",3-5-2,2,81.55,84.0,82.5,78.83
Nigeria,"[V. Enyeama, C. Awaziem, K. Omeruo, U. Agbo, O...",3-5-2,2,82.82,84.5,85.33,79.0
Senegal,"[A. Gomis, K. Koulibaly, K. Mbodj, K. Mbodj, K...",3-5-2,1,84.18,87.25,84.0,81.17
Tunisia,"[F. Ben Mustapha, A. Abdennour, Y. Benalouane,...",3-5-2,3,74.45,78.0,76.0,72.33
Australia,"[M. Ryan, A. Gersbach, T. Sainsbury, B. Wright...",3-5-2,2,77.82,77.33,78.5,77.5
Iran,"[A. Haghighi, M. Mohammadi, K. Ansarifard, K. ...",3-5-2,3,76.55,79.75,79.0,71.67
Japan,"[K. Nakamura, G. Shoji, N. Ueda, M. Hasebe, Y....",3-5-2,2,79.55,80.5,81.0,77.67
Korea Republic,"[Yoon Bo Sang, Kim Min Jae, An Hyeon Beom, Kim...",3-5-2,2,80.36,82.0,79.0,78.83
Saudi Arabia,"[M. Al Owais, M. Hawsawi, O. Hawsawi, Y. Al Sh...",4-4-2,2,77.45,79.33,77.0,76.5


In [261]:
def get_country_squad(country):
    return fifa_dataset[fifa_dataset['Nationality'] == country]

#panama = get_country_squad('Panama')
#print panama
#print panama['Preferred Position']
#print iran['Preferred Position'].unique()
squad_list = [squad_352_strict, squad_442_strict, squad_433_strict, squad_343_strict, squad_532_strict]
squad_name = ['3-5-2', '4-4-2', '4-3-3', '3-4-3', '5-3-2']

#best_rating, best_squad, best_formation = get_best_formation_all(squad_list, 'Germany')
#print best_rating, best_squad, best_formation
#a,b = get_best_squad_n(squad_532_adj, 'Germany', fifa_dataset)
#print a,b
# for i, sq in enumerate(squad_list_adj):
#     print squad_name[i]
#     a,b = get_best_squad_n(sq, 'France', fifa_dataset)
#     print a, b

#print get_country_squad('France')

#rate, saudi, form, info = get_best_formation_all(squad_list_adj, 'Saudi Arabia')
#print saudi
#print rate, saudi, form, info
#
best_rating, best_squad, best_formation, squad_stats = get_best_formation_all(squad_list_adj, 'Senegal')
print get_team_stats(squad_stats)

#print info.split('\n')#[1:11]
# print team

Position Potential
GK 81
CB 87
CB 80
CB 80
CB 80
RB 79
ST 90
LW 87
CAM 87
ST 85
CM 84
(84.0, 81.170000000000002, 87.25)


In [284]:
# #print prior.head(5)
# #print fifa_dataset.tail(5)
# print 
# #print prior.shape
# saudi = fifa_dataset[fifa_dataset['Nationality'] == 'Saudi Arabia']
# print saudi

p=pd.DataFrame(d).reindex_axis(['Country', 'Squad', 'Formation', 'Tier', 'Rating', 'Attack', 'Midfield', 'Defence'], axis = 1).set_index('Country')
p.index.get_values()


array(['Egypt', 'Morocco', 'Nigeria', 'Senegal', 'Tunisia', 'Australia',
       'Iran', 'Japan', 'Korea Republic', 'Saudi Arabia', 'Belgium',
       'Croatia', 'Denmark', 'England', 'France', 'Germany', 'Iceland',
       'Poland', 'Portugal', 'Russia', 'Serbia', 'Spain', 'Sweden',
       'Switzerland', 'Costa Rica', 'Mexico', 'Panama', 'Argentina',
       'Brazil', 'Colombia', 'Peru', 'Uruguay'], dtype=object)

In [210]:


#best_rating, best_squad, best_formation = get_best_formation_all(squad_list, 'Germany')
#print best_rating, best_squad, best_formation



#print best_squad
#get_team_stats(best_squad)
# --- 
#with open()


#------------

# def _pref(x):
#     prefs = temp.get_value(x,'Preferred Positions')
#     attr = []
#     if len(prefs)>1:
#         for i in prefs:
#              t = temp.get_value(x,i)
#              attr.append(t)
#         maxval = max(attr)
#         idx = attr.index(maxval)
#         return prefs[idx]
#     else:
#         return prefs[0]

# rating_352_EN_Overall, best_list_352_EN_Overall = get_best_squad_n(squad_352_strict, curCountry, fifa_dataset, 'Overall')
# rating_352_EN_Potential, best_list_352_EN_Potential = get_best_squad_n(squad_352_strict, curCountry, fifa_dataset,'Potential')

# # 
# print('-Overall-')
# print('Average rating: {:.1f}'.format(rating_352_EN_Overall))
# print(best_list_352_EN_Overall)

# print('-Potential-')
# print('Average rating: {:.1f}'.format(rating_352_EN_Potential))
# print(best_list_352_EN_Potential)

ValueError: too many values to unpack

In [170]:
#np.histogram(scores,3)
#print scores
c=[]
for score in scores:
    if score < 77.: c.append(3)
    elif score < 84.: c.append(2)
    else: c.append(1)

#for s in list(zip(scores, c)): print s
print best_squad.split()

[u'Position', u'Player', u'Potential', u'GK', u'F.', u'Muslera', u'82', u'CB', u'D.', u'God\xedn', u'88', u'CB', u'J.', u'Gim\xe9nez', u'87', u'LWB', u'M.', u'Saracchi', u'85', u'ST', u'L.', u'Su\xe1rez', u'92', u'ST', u'E.', u'Cavani', u'87', u'CM', u'N.', u'N\xe1ndez', u'85', u'RM', u'F.', u'Valverde', u'85', u'CDM', u'M.', u'Lemos', u'83', u'CM', u'L.', u'Torreira', u'83', u'CM', u'R.', u'Bentancur', u'83']


In [179]:
#temp.set_index('Country')
temp = pd.DataFrame(d)
temp.set_index('Country')

Unnamed: 0_level_0,Attack,Defence,Midfield,Overall Rating,Squad,Tier
Country,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
Egypt,82.33,75.5,81.0,79.0,Position Player Potential\n GK A....,2
Morocco,83.25,79.5,82.5,81.55,Position Player Potential\n GK ...,2
Nigeria,84.0,80.0,85.33,82.82,Position Player Potential\n GK V...,2
Senegal,87.25,82.0,83.5,84.18,Position Player Potential\n G...,1
Tunisia,78.0,72.5,75.25,74.45,Position Player Potential\n GK ...,3
Australia,77.25,78.25,78.5,77.82,Position Player Potential\n GK ...,2
Iran,79.75,74.5,76.5,76.55,Position Player Potential\n GK...,3
Japan,80.5,78.0,80.5,79.55,Position Player Potential\n GK K....,2
Korea Republic,82.0,79.75,79.0,80.36,Position Player Potential\n GK ...,2
Saudi Arabia,79.33,76.8,77.0,77.45,Position Player Potential\n GK ...,2


In [15]:
df.index

Index([u'Cristiano Ronaldo', u'L. Messi', u'Neymar', u'L. Suárez', u'M. Neuer',
       u'R. Lewandowski', u'De Gea', u'E. Hazard', u'T. Kroos', u'G. Higuaín',
       ...
       u'R. White', u'A. Conway', u'T. Sawyer', u'J. Keeble', u'T. Käßemodel',
       u'A. Kelsey', u'B. Richardson', u'J. Young', u'J. Lundstram',
       u'L. Sackey'],
      dtype='object', name=u'Name', length=17981)

In [21]:
# Egypt = fifa_dataset[fifa_dataset['Nationality']=='Egypt']
# Morocco = fifa_dataset[fifa_dataset['Nationality']=='Morocco']
# Nigeria = fifa_dataset[fifa_dataset['Nationality']=='Nigeria']
# Senegal = fifa_dataset[fifa_dataset['Nationality']=='Senegal']
# Tunisia = fifa_dataset[fifa_dataset['Nationality']=='Tunisia']
# Australia = fifa_dataset[fifa_dataset['Nationality']=='Australia']
# Iran = fifa_dataset[fifa_dataset['Nationality']=='Iran']
# Japan = fifa_dataset[fifa_dataset['Nationality']=='Japan']
# Korea = fifa_dataset[fifa_dataset['Nationality']=='Korea Republic']
# SaudiArabia = fifa_dataset[fifa_dataset['Nationality']=='Saudi Arabia']
# Belgium = fifa_dataset[fifa_dataset['Nationality']=='Belgium']
# Croatia = fifa_dataset[fifa_dataset['Nationality']=='Croatia']
# Denmark = fifa_dataset[fifa_dataset['Nationality']=='Denmark']
# England = fifa_dataset[fifa_dataset['Nationality']=='England']
# France = fifa_dataset[fifa_dataset['Nationality']=='France']
# Germany = fifa_dataset[fifa_dataset['Nationality']=='Germany']
# Iceland = fifa_dataset[fifa_dataset['Nationality']=='Iceland']
# Poland = fifa_dataset[fifa_dataset['Nationality']=='Poland']
# Portugal = fifa_dataset[fifa_dataset['Nationality']=='Russia']
# Serbia = fifa_dataset[fifa_dataset['Nationality']=='Serbia']
# Spain = fifa_dataset[fifa_dataset['Nationality']=='Spain']
# Switzerland = fifa_dataset[fifa_dataset['Nationality']=='Sweden']
# CostaRica = fifa_dataset[fifa_dataset['Nationality']=='Costa Rica']
# Mexico = fifa_dataset[fifa_dataset['Nationality']=='Mexico']
# Panema = fifa_dataset[fifa_dataset['Nationality']=='Panema']
# Argentina = fifa_dataset[fifa_dataset['Nationality']=='Argentina']
# Brazil = fifa_dataset[fifa_dataset['Nationality']=='Brazil']
# Colombia = fifa_dataset[fifa_dataset['Nationality']=='Colombia']
# Peru = fifa_dataset[fifa_dataset['Nationality']=='Peru']
# Uruguay = fifa_dataset[fifa_dataset['Nationality']=='Uruguay']

Unnamed: 0_level_0,Age,Photo,Nationality,Flag,Overall,Potential,Club,Club Logo,Value,Wage,...,RB,RCB,RCM,RDM,RF,RM,RS,RW,RWB,ST
Name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Cristiano Ronaldo,32,https://cdn.sofifa.org/48/18/players/20801.png,Portugal,https://cdn.sofifa.org/flags/38.png,94,94,Real Madrid CF,https://cdn.sofifa.org/24/18/teams/243.png,€95.5M,€565K,...,61.0,53.0,82.0,62.0,91.0,89.0,92.0,91.0,66.0,92.0
L. Messi,30,https://cdn.sofifa.org/48/18/players/158023.png,Argentina,https://cdn.sofifa.org/flags/52.png,93,93,FC Barcelona,https://cdn.sofifa.org/24/18/teams/241.png,€105M,€565K,...,57.0,45.0,84.0,59.0,92.0,90.0,88.0,91.0,62.0,88.0
Neymar,25,https://cdn.sofifa.org/48/18/players/190871.png,Brazil,https://cdn.sofifa.org/flags/54.png,92,94,Paris Saint-Germain,https://cdn.sofifa.org/24/18/teams/73.png,€123M,€280K,...,59.0,46.0,79.0,59.0,88.0,87.0,84.0,89.0,64.0,84.0
L. Suárez,30,https://cdn.sofifa.org/48/18/players/176580.png,Uruguay,https://cdn.sofifa.org/flags/60.png,92,92,FC Barcelona,https://cdn.sofifa.org/24/18/teams/241.png,€97M,€510K,...,64.0,58.0,80.0,65.0,88.0,85.0,88.0,87.0,68.0,88.0
M. Neuer,31,https://cdn.sofifa.org/48/18/players/167495.png,Germany,https://cdn.sofifa.org/flags/21.png,92,92,FC Bayern Munich,https://cdn.sofifa.org/24/18/teams/21.png,€61M,€230K,...,,,,,,,,,,
R. Lewandowski,28,https://cdn.sofifa.org/48/18/players/188545.png,Poland,https://cdn.sofifa.org/flags/37.png,91,91,FC Bayern Munich,https://cdn.sofifa.org/24/18/teams/21.png,€92M,€355K,...,58.0,57.0,78.0,62.0,87.0,82.0,88.0,84.0,61.0,88.0
De Gea,26,https://cdn.sofifa.org/48/18/players/193080.png,Spain,https://cdn.sofifa.org/flags/45.png,90,92,Manchester United,https://cdn.sofifa.org/24/18/teams/11.png,€64.5M,€215K,...,,,,,,,,,,
E. Hazard,26,https://cdn.sofifa.org/48/18/players/183277.png,Belgium,https://cdn.sofifa.org/flags/7.png,90,91,Chelsea,https://cdn.sofifa.org/24/18/teams/5.png,€90.5M,€295K,...,59.0,47.0,81.0,61.0,87.0,87.0,82.0,88.0,64.0,82.0
T. Kroos,27,https://cdn.sofifa.org/48/18/players/182521.png,Germany,https://cdn.sofifa.org/flags/21.png,90,90,Real Madrid CF,https://cdn.sofifa.org/24/18/teams/243.png,€79M,€340K,...,76.0,72.0,87.0,82.0,81.0,81.0,77.0,80.0,78.0,77.0
G. Higuaín,29,https://cdn.sofifa.org/48/18/players/167664.png,Argentina,https://cdn.sofifa.org/flags/52.png,90,90,Juventus,https://cdn.sofifa.org/24/18/teams/45.png,€77M,€275K,...,51.0,46.0,71.0,52.0,84.0,79.0,87.0,82.0,55.0,87.0
