In [1]:
from socceraction.data.wyscout import PublicWyscoutLoader
from socceraction.spadl.wyscout import convert_to_actions as convert_to_actions_wyscout
from socceraction.spadl.statsbomb import convert_to_actions as convert_to_actions_statsbomb
from socceraction.data.opta import OptaLoader
from socceraction.data.statsbomb import StatsBombLoader
from socceraction.spadl.config import actiontypes, bodyparts
import socceraction.spadl as spadl
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
from sklearn import preprocessing
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_squared_error, roc_auc_score, brier_score_loss, log_loss, mean_absolute_error, r2_score, mean_absolute_percentage_error
from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score, matthews_corrcoef, balanced_accuracy_score
from xgboost import XGBClassifier, XGBRegressor
from catboost import CatBoostClassifier
import math
import pickle
import os
from name_matching.name_matcher import NameMatcher
from rapidfuzz import fuzz
from imblearn.over_sampling import RandomOverSampler, SMOTE
from imblearn.under_sampling import RandomUnderSampler
from sklearn.feature_selection import r_regression, SelectKBest, chi2, mutual_info_classif, SequentialFeatureSelector, RFECV, SelectFromModel
from scipy.stats import pearsonr, chisquare
from mrmr import mrmr_classif
from sklearn.neighbors import KNeighborsClassifier
from sklearn.ensemble import RandomForestClassifier, RandomForestRegressor
from sklearn.svm import LinearSVR
from sklearn.linear_model import Lasso, LogisticRegression

In [2]:
# CONFIG FOR EXPERIMENTS SCENARIO
USE_EVALUATION_METRIC_CLASSIFICATION = True
INCLUDE_SKILL_PLAYERS_OPTIONS = [
    False,
    True
]
SAMPLING_OPTIONS = [
    "none",
    "random_oversampled",
    "random_undersampled",
    "smote_oversampled"
]
FEATURE_SELECTION_OPTIONS = [
    "pearson",
    "chisquare",
    "mutualinf",
    "mrmr",
    "rfembedded",
    "lasso"
]
if USE_EVALUATION_METRIC_CLASSIFICATION:
    MODEL_ALGORITHM_OPTIONS = [
        "xgbclassifier",
        "catboostclassifier",
        "rfclassifier"
    ]
else:
    MODEL_ALGORITHM_OPTIONS = [
        "xgbregressor",
        # "rfregressor",
        # "logregression"
    ]
CONFIG_EXPERIMENTS_SCENARIO_MAP = {}

def construct_config_experiments_scenario_map():
    index_counter = 1
    for include_skill_opt in INCLUDE_SKILL_PLAYERS_OPTIONS:
        for sampling_opt in SAMPLING_OPTIONS:
            if (include_skill_opt == False):
                for algorithm_opt in MODEL_ALGORITHM_OPTIONS:
                    CONFIG_EXPERIMENTS_SCENARIO_MAP[index_counter] = \
                        {"include_skill_opt" : 1 if include_skill_opt else 0, \
                        "sampling_opt" : sampling_opt, \
                        "feature_selection_opt" : "none", \
                        "algorithm_opt" : algorithm_opt}
                    index_counter += 1
            else:
                for feature_selection_opt in FEATURE_SELECTION_OPTIONS:
                    for algorithm_opt in MODEL_ALGORITHM_OPTIONS:
                        CONFIG_EXPERIMENTS_SCENARIO_MAP[index_counter] = \
                            {"include_skill_opt" : 1 if include_skill_opt else 0, \
                            "sampling_opt" : sampling_opt, \
                            "feature_selection_opt" : feature_selection_opt, \
                            "algorithm_opt" : algorithm_opt}
                        index_counter += 1

construct_config_experiments_scenario_map()

In [3]:
# COLUMNS FOR TEST EXPERIMENT RESULT
COLUMNS_EVALUATION_METRIC_CLASSIFICATION = [
    "rec_score",
    "prec_score",
    "F1_score",
    "acc_score",
    "auc_score",
    "mcc_score",
    "brier_score",
    "log_loss_score",
    "balanced_acc_score"
]
COLUMNS_EVALUATION_METRIC_REGRESSION = [
    "mean_squared_error_score",
    "root_mean_squared_error_score",
    "auc_score",
    "brier_score",
    "log_loss_score",
    "mean_absolute_error_score",
    "r_squared_score",
    "mean_absolute_percentage_error_score"
]
COLUMNS_SCENARIO_NAME = [
    "include_skill_opt",
    "sampling_opt",
    "feature_selection_opt",
    "algorithm_opt"
]
if (USE_EVALUATION_METRIC_CLASSIFICATION):
    COLUMNS_EXPERIMENT_RESULT = ["case_number"] + COLUMNS_SCENARIO_NAME + COLUMNS_EVALUATION_METRIC_CLASSIFICATION
else:
    COLUMNS_EXPERIMENT_RESULT = ["case_number"] + COLUMNS_SCENARIO_NAME + COLUMNS_EVALUATION_METRIC_REGRESSION

In [4]:
api_wyscout = PublicWyscoutLoader(root="data/wyscout")
api_opta = OptaLoader(root="data/opta")
api_statsbomb = StatsBombLoader(root="data/statsbomb", getter="local")

In [5]:
for idx, action_name in enumerate(actiontypes):
    print(f'action_id : {idx}   action_name : {action_name}')

action_id : 0   action_name : pass
action_id : 1   action_name : cross
action_id : 2   action_name : throw_in
action_id : 3   action_name : freekick_crossed
action_id : 4   action_name : freekick_short
action_id : 5   action_name : corner_crossed
action_id : 6   action_name : corner_short
action_id : 7   action_name : take_on
action_id : 8   action_name : foul
action_id : 9   action_name : tackle
action_id : 10   action_name : interception
action_id : 11   action_name : shot
action_id : 12   action_name : shot_penalty
action_id : 13   action_name : shot_freekick
action_id : 14   action_name : keeper_save
action_id : 15   action_name : keeper_claim
action_id : 16   action_name : keeper_punch
action_id : 17   action_name : keeper_pick_up
action_id : 18   action_name : clearance
action_id : 19   action_name : bad_touch
action_id : 20   action_name : non_action
action_id : 21   action_name : dribble
action_id : 22   action_name : goalkick


In [6]:
for idx, bodypart_name in enumerate(bodyparts):
    print(f'bodypart_id : {idx}   bodypart_name : {bodypart_name}')

bodypart_id : 0   bodypart_name : foot
bodypart_id : 1   bodypart_name : head
bodypart_id : 2   bodypart_name : other
bodypart_id : 3   bodypart_name : head/other
bodypart_id : 4   bodypart_name : foot_left
bodypart_id : 5   bodypart_name : foot_right


In [7]:
def convert_events_df_to_spadl(events_df, home_team_id, source):
    if (source == "Statsbomb"):
        spadl_events_df = convert_to_actions_statsbomb(events_df, home_team_id)
    else:
        spadl_events_df = convert_to_actions_wyscout(events_df, home_team_id)
    spadl_events_df['time_seconds'] = spadl_events_df['time_seconds'].astype('float64')
    spadl_events_df['timestamp'] = pd.to_datetime(spadl_events_df['time_seconds'], unit='s')
    return spadl_events_df

In [8]:
# FUNCTION TO ADD ADDITIONAL INFO IN RAW SPADL DATAFRAME
STANDARD_LENGTH_COURT = 105
STANDARD_WIDTH_COURT = 68
STANDARD_GOALLINE_WIDTH = 7.32
STANDARD_LENGTH_COURT_STATSBOMB = 120
STANDARD_WIDTH_COURT_STATSBOMB = 80

# Helper Functions
def calculate_distance_to_goal(length_court, width_court, coordinate_x, coordinate_y, is_home_team):
    if is_home_team:
        distance_to_goal = math.sqrt((abs(length_court - coordinate_x)) ** 2 + (abs((0.5 * width_court) - coordinate_y)) ** 2)
    else:
        distance_to_goal = math.sqrt((coordinate_x) ** 2 + (abs((0.5 * width_court) - coordinate_y)) ** 2)
    return distance_to_goal

def calculate_distance_to_goal_apply_df(row):
    return calculate_distance_to_goal(STANDARD_LENGTH_COURT, STANDARD_WIDTH_COURT, row['start_x'], row['start_y'], row['is_home_team'])

# def calculate_angle_to_goal(goalline_width, length_court, width_court, coordinate_x, coordinate_y, is_home_team):
#     if is_home_team:
#         L = abs(length_court - coordinate_x)
#     else:
#         L = coordinate_x
#     W = abs((0.5 * width_court) - coordinate_y)
#     return math.atan((goalline_width * L) / (L ** 2 + W ** 2 - (goalline_width / 2) ** 2))

def calculate_angle_to_goal_v2(goalline_width, length_court, width_court, coordinate_x, coordinate_y, is_home_team):
    if is_home_team:
        coordinate_x_post_1, coordinate_x_post_2 = (length_court, length_court)
    else:
        coordinate_x_post_1, coordinate_x_post_2 = (0, 0)
    coordinate_y_post_1 = (width_court / 2) + (goalline_width / 2)
    coordinate_y_post_2 = (width_court / 2) - (goalline_width / 2)

    distance_to_post_1 = math.sqrt(abs(coordinate_x - coordinate_x_post_1) ** 2 + abs(coordinate_y - coordinate_y_post_1) ** 2)
    distance_to_post_2 = math.sqrt(abs(coordinate_x - coordinate_x_post_2) ** 2 + abs(coordinate_y - coordinate_y_post_2) ** 2)

    return math.acos((distance_to_post_1 ** 2 + distance_to_post_2 ** 2 - goalline_width ** 2) / (2 * distance_to_post_1 * distance_to_post_2))

def calculate_angle_to_goal_apply_df(row):
    return calculate_angle_to_goal_v2(STANDARD_GOALLINE_WIDTH, STANDARD_LENGTH_COURT, STANDARD_WIDTH_COURT, row['start_x'], row['start_y'], row['is_home_team'])

def filter_out_is_home_team_apply_df(row, home_team_id):
    return 1 if row['team_id'] == home_team_id else 0

# Helper functions specific to statsbomb opponent data
def calculate_distance_between_two_coordinates(x1, y1, x2, y2):
    return math.sqrt(abs(x2-x1) ** 2 + abs(y2-y1) ** 2)

def filter_out_non_opponent_coordinate_freeze_frame(freeze_frame_360_list):
    if (freeze_frame_360_list == None or not isinstance(freeze_frame_360_list, list)):
        return []
    return [x for x in freeze_frame_360_list if x['teammate'] == False and x['actor'] == False]

def convert_statsbomb_coordinate_to_spadl_coordinate(coordinate_x, coordinate_y):
    converted_coordinate_x = (STANDARD_LENGTH_COURT / STANDARD_LENGTH_COURT_STATSBOMB) * coordinate_x
    converted_coordinate_y = (STANDARD_WIDTH_COURT / STANDARD_WIDTH_COURT_STATSBOMB) * coordinate_y
    return (converted_coordinate_x, converted_coordinate_y)

def calculate_distance_opponent_apply_df(row):
    freeze_frame_360_opponents = filter_out_non_opponent_coordinate_freeze_frame(row['freeze_frame_360'])
    list_distance_opponent = []
    for object_loc in freeze_frame_360_opponents:
        opponent_x, opponent_y = convert_statsbomb_coordinate_to_spadl_coordinate(object_loc['location'][0], object_loc['location'][1])
        distance_opponent = calculate_distance_between_two_coordinates(row['start_x'], row['start_y'], opponent_x, opponent_y)
        list_distance_opponent.append(distance_opponent)
    return min(list_distance_opponent) if len(list_distance_opponent) > 0 else 0

def calculate_num_opponent_closer_goal(start_x, start_y, freeze_frame_360, is_home_team):
    freeze_frame_360_opponents = filter_out_non_opponent_coordinate_freeze_frame(freeze_frame_360)
    if (is_home_team):
        coordinate_x_goal = STANDARD_LENGTH_COURT
    else:
        coordinate_x_goal = 0
    coordinate_y_goal = STANDARD_WIDTH_COURT / 2

    num_opponent_closer_to_goal = 0
    for object_loc in freeze_frame_360_opponents:
        opponent_x, opponent_y = convert_statsbomb_coordinate_to_spadl_coordinate(object_loc['location'][0], object_loc['location'][1])
        distance_passer_to_goal = calculate_distance_between_two_coordinates(start_x, start_y, coordinate_x_goal, coordinate_y_goal)
        distance_opponent_to_goal = calculate_distance_between_two_coordinates(opponent_x, opponent_y, coordinate_x_goal, coordinate_y_goal)
        if (distance_opponent_to_goal < distance_passer_to_goal):
            num_opponent_closer_to_goal += 1
    return num_opponent_closer_to_goal

def calculate_num_opponent_closer_goal_apply_df(row, home_team_id):
    return calculate_num_opponent_closer_goal(row['start_x'], row['start_y'], row['freeze_frame_360'], (row['team_id'] == home_team_id))

def calculate_num_opponent_in_path(start_x, start_y, freeze_frame_360):
    path_distance = 10
    freeze_frame_360_opponents = filter_out_non_opponent_coordinate_freeze_frame(freeze_frame_360)
    num_opponent_in_path = 0
    for object_loc in freeze_frame_360_opponents:
        opponent_x, opponent_y = convert_statsbomb_coordinate_to_spadl_coordinate(object_loc['location'][0], object_loc['location'][1])
        distance_with_opponent = calculate_distance_between_two_coordinates(start_x, start_y, opponent_x, opponent_y)
        if (distance_with_opponent <= path_distance):
            num_opponent_in_path += 1
    return num_opponent_in_path

def calculate_num_opponent_in_path_apply_df(row):
    return calculate_num_opponent_in_path(row['start_x'], row['start_y'], row['freeze_frame_360'])

# Add distance to goal column
def add_distance_to_goal_column_to_spadl_df(spadl_df):
    spadl_df['distance_to_goal'] = spadl_df.apply(calculate_distance_to_goal_apply_df, axis=1)
    return spadl_df

# Add angle to goal column 
def add_angle_to_goal_column_to_spadl_df(spadl_df):
    spadl_df['angle_to_goal'] = spadl_df.apply(calculate_angle_to_goal_apply_df, axis=1)
    return spadl_df

# Add is_home_team column (boolean 0/1)
def add_is_home_team_column_to_spadl_df(spadl_df, home_team_id):
    spadl_df['is_home_team'] = spadl_df.apply(lambda x : filter_out_is_home_team_apply_df(x, home_team_id), axis=1)
    return spadl_df

# Opponent Feature 1 : distance opponent
def add_distance_opponent_column_to_spadl_df(spadl_df):
    spadl_df['distance_opponent'] = spadl_df.apply(calculate_distance_opponent_apply_df, axis=1)
    return spadl_df

# Opponent Feature 2 : opponents closer to goal
def add_num_opponent_closer_goal_column_to_spadl_df(spadl_df, home_team_id):
    spadl_df['num_opponent_closer_goal'] = spadl_df.apply(lambda x : calculate_num_opponent_closer_goal_apply_df(x, home_team_id), axis=1)
    return spadl_df

# Opponent Feature 3 : opponents in path
def add_num_opponent_in_path_column_to_spadl_df(spadl_df):
    spadl_df['num_opponent_in_path'] = spadl_df.apply(calculate_num_opponent_in_path_apply_df, axis=1)
    return spadl_df

In [9]:
# Collect all dataset action specific type, export them to csv files
# Shot (action_id = 11), shot_penalty (action_id = 12), shot_freekick (action_id = 13)
SHOT_ACTION_ID = [11, 12, 13] 

def collect_raw_goal_spadl_df(source="Wyscout", period=1):
    if source == "Statsbomb":
        api = api_statsbomb
    else:
        api = api_wyscout
    list_competitions_ids = []
    list_game_ids = []

    competitions_df = api.competitions()
    for _, row in competitions_df.iterrows():
        if source == "Statsbomb":
            if row['competition_gender'] == 'male':
                list_competitions_ids.append((row['competition_id'], row['season_id']))
        else:
            list_competitions_ids.append((row['competition_id'], row['season_id']))
        
    for competition_id, season_id in list_competitions_ids:
        games_df = api.games(competition_id, season_id)
        for _, row in games_df.iterrows():
            list_game_ids.append((row['game_id'], row['home_team_id'], row['away_team_id']))
            
    for game_id, home_team_id, away_team_id in list_game_ids:
        try:
            if (source == "Statsbomb"):
                this_game_events_df = api.events(game_id, load_360=True)
            else:
                this_game_events_df = api.events(game_id)
            this_game_events_spadl_df = convert_events_df_to_spadl(this_game_events_df, home_team_id, source)

            # Add column 360 data into events spadl data (Statsbomb)
            if (source == "Statsbomb"):
                this_game_events_spadl_df = pd.merge(this_game_events_spadl_df, this_game_events_df[["event_id", "visible_area_360", "freeze_frame_360"]], how="inner", left_on="original_event_id", right_on="event_id")
                this_game_events_spadl_df.dropna(subset=["freeze_frame_360"])

            # Filter action id with type shot only, pick only data from first period
            this_game_events_spadl_df = this_game_events_spadl_df[this_game_events_spadl_df['type_id'].isin(SHOT_ACTION_ID)]
            # if (period != None):
            #     this_game_events_spadl_df = this_game_events_spadl_df[this_game_events_spadl_df['period_id'] == period]
            # else:
            #     this_game_events_spadl_df = this_game_events_spadl_df[this_game_events_spadl_df['period_id'] == 1]
            
            # Add additional computed column to support xG model
            this_game_events_spadl_df = add_is_home_team_column_to_spadl_df(this_game_events_spadl_df, home_team_id)
            this_game_events_spadl_df = add_distance_to_goal_column_to_spadl_df(this_game_events_spadl_df)
            this_game_events_spadl_df = add_angle_to_goal_column_to_spadl_df(this_game_events_spadl_df)
            if (source == "Statsbomb"):
                this_game_events_spadl_df = add_distance_opponent_column_to_spadl_df(this_game_events_spadl_df)
                this_game_events_spadl_df = add_num_opponent_closer_goal_column_to_spadl_df(this_game_events_spadl_df, home_team_id)
                this_game_events_spadl_df = add_num_opponent_in_path_column_to_spadl_df(this_game_events_spadl_df)

            # Export to external csv iteratively
            this_game_events_spadl_df.to_csv(f'data/training_data_xgoal/{game_id}_{home_team_id}_{away_team_id}_xgoal_data.csv')
        
        except FileNotFoundError:
            print(f'File 360 data not found {game_id}-{home_team_id}-{away_team_id}') 

In [10]:
# MAIN DRIVER (comment it if csv files already loaded)
# collect_raw_goal_spadl_df(source="Statsbomb")

In [11]:
# Load csv datas already retrieved then concat them into one big dataframe
import os

DIRECTORY_XGOAL_CSV_DATAS = "data/training_data_xgoal"

def load_and_concat_xgoal_df_from_csv():
    list_pass_event_df = []
    for filename in os.listdir(DIRECTORY_XGOAL_CSV_DATAS):
        f = os.path.join(DIRECTORY_XGOAL_CSV_DATAS, filename)
        if os.path.isfile(f):
            pass_event_df = pd.read_csv(f)
            list_pass_event_df.append(pass_event_df)
    return pd.concat(list_pass_event_df)

In [12]:
# JOIN ALREADY CONSTRUCTED PLAYER SKILLS DATASET WITH ORIGIN EVENT DATASET WYSCOUT
DIRECTORY_FINAL_PLAYERS_CSV_DATAS = "data/players_skill_dataset/final_players_skill_dataset.csv"

player_skills_dataset = pd.read_csv(DIRECTORY_FINAL_PLAYERS_CSV_DATAS)
big_dataframe_xgoal_model = load_and_concat_xgoal_df_from_csv()
big_dataframe_xgoal_model = big_dataframe_xgoal_model.merge(player_skills_dataset, how='inner',on='player_id')
big_dataframe_xgoal_model.head()

Unnamed: 0,Unnamed: 0_x,game_id_x,original_event_id,period_id,time_seconds,team_id_x,player_id,start_x,start_y,end_x,...,LWB,LDM,CDM,RDM,RWB,LB,LCB,CB,RCB,RB
0,58,3788741,fc81639c-6e60-49d3-b29a-82b2b8c5746d,1,129.0,914,7788.0,4.764706,42.263291,0.0,...,60+3,58+3,58+3,58+3,60+3,58+3,55+3,55+3,55+3,58+3
1,518,3788741,5fae6701-47c3-4847-b346-5d792c0b94c1,1,1214.0,914,7788.0,20.205882,37.270886,13.411765,...,60+3,58+3,58+3,58+3,60+3,58+3,55+3,55+3,55+3,58+3
2,809,3788741,597f07f6-c84e-47d3-8033-05e3e46d7035,1,1925.0,914,7788.0,8.117647,40.283544,0.0,...,60+3,58+3,58+3,58+3,60+3,58+3,55+3,55+3,55+3,58+3
3,1091,3788741,8a902d87-4dcb-424a-8746-7d469802f594,1,2562.0,914,7788.0,14.558824,40.8,2.911765,...,60+3,58+3,58+3,58+3,60+3,58+3,55+3,55+3,55+3,58+3
4,1321,3788741,882d229d-aaf0-4b55-a601-3776fedb67f9,2,538.0,914,7788.0,7.323529,25.736709,0.0,...,60+3,58+3,58+3,58+3,60+3,58+3,55+3,55+3,55+3,58+3


In [13]:
# SELECT ONLY FEATURED COLUMN FROM BIG DATASETS
features_column_included = ["start_x", "start_y", "distance_to_goal", "angle_to_goal", "distance_opponent", "num_opponent_closer_goal", 
                            "num_opponent_in_path", "result_id"]
player_skills_column_included = ["acceleration", "aggression", "agility", "balance", "ball_control",
                                 "composure", "crossing", "curve", "dribbling", "finishing",
                                 "freekick_accuracy", "heading_accuracy", "interceptions", "jumping", "long_passing",
                                 "long_shots", "marking", "penalties", "positioning", "reactions",
                                 "shot_power", "sliding_tackle", "sprint_speed", "stamina", "short_passing",
                                 "standing_tackle", "strength", "vision", "volleys"]
player_attribute_column_included = ["height_cm", "weight_kgs", "age"]

big_dataframe_xgoal_model = big_dataframe_xgoal_model[[c for c in big_dataframe_xgoal_model.columns if c in (features_column_included + player_skills_column_included + player_attribute_column_included)]]
big_dataframe_xgoal_model.head()

Unnamed: 0,start_x,start_y,result_id,distance_to_goal,angle_to_goal,distance_opponent,num_opponent_closer_goal,num_opponent_in_path,age,height_cm,...,long_shots,aggression,interceptions,positioning,vision,penalties,composure,marking,standing_tackle,sliding_tackle
0,4.764706,42.263291,0,9.538574,0.422454,87.694924,0,0,29.0,185.42,...,80.0,77.0,40.0,91.0,65.0,78.0,81.0,34.0,33.0,32.0
1,20.205882,37.270886,0,20.468912,0.349692,58.649862,0,0,29.0,185.42,...,80.0,77.0,40.0,91.0,65.0,78.0,81.0,34.0,33.0,32.0
2,8.117647,40.283544,0,10.265433,0.573557,83.287978,0,0,29.0,185.42,...,80.0,77.0,40.0,91.0,65.0,78.0,81.0,34.0,33.0,32.0
3,14.558824,40.8,0,16.068582,0.410588,71.165678,0,0,29.0,185.42,...,80.0,77.0,40.0,91.0,65.0,78.0,81.0,34.0,33.0,32.0
4,7.323529,25.736709,0,11.041561,0.45883,83.654019,0,0,29.0,185.42,...,80.0,77.0,40.0,91.0,65.0,78.0,81.0,34.0,33.0,32.0


In [14]:
# CASE 1 : Random Oversample Function
def training_data_random_oversampled(X_train, Y_train):
    ros = RandomOverSampler(random_state=42)
    X_resampled, Y_resampled = ros.fit_resample(X_train, Y_train)
    return (X_resampled, Y_resampled)

# CASE 2 : Random Undersample Function
def training_data_random_undersampled(X_train, Y_train):
    rus = RandomUnderSampler(random_state=42)
    X_resampled, Y_resampled = rus.fit_resample(X_train, Y_train)
    return (X_resampled, Y_resampled)

# CASE 3 : Random SMOTE Oversample Function
def training_data_smote_oversampled(X_train, Y_train):
    X_resampled, Y_resampled = SMOTE().fit_resample(X_train, Y_train)
    return (X_resampled, Y_resampled)

# V CASE 1 : Feature Selection - Pearson Coefficient
def filter_columns_feature_selection_pearson(X_train, Y_train, columns_considered, threshold):
    new_columns_after_selection = []
    for _, skill in enumerate(columns_considered):
        correlation_value, _ = pearsonr(X_train[skill], Y_train)
        if correlation_value >= threshold:
            new_columns_after_selection.append(skill)
    return new_columns_after_selection

def training_data_feature_selection_pearson(X_train, Y_train, columns_considered, threshold):
    columns_selected = filter_columns_feature_selection_pearson(X_train, Y_train, columns_considered, threshold)
    columns_omitted = [x for x in columns_considered if x not in columns_selected]
    final_columns = [x for x in list(X_train.columns) if x not in columns_omitted]
    print(final_columns)
    return (X_train[final_columns], Y_train)

# V CASE 2 : Feature Selection - Chi Square
def filter_columns_feature_selection_chisquare(X_train, Y_train, columns_considered, num_of_features):
    chi2_selector = SelectKBest(chi2, k=num_of_features) 
    df_feature = X_train[columns_considered]
    chi2_selector.fit(df_feature, Y_train)
    cols = chi2_selector.get_support(indices=True)
    df_selected_features = df_feature.iloc[:,cols]
    return df_selected_features.columns

def training_data_feature_selection_chisquare(X_train, Y_train, columns_considered, num_of_features):
    columns_selected = filter_columns_feature_selection_chisquare(X_train, Y_train, columns_considered, num_of_features)
    columns_omitted = [x for x in columns_considered if x not in columns_selected]
    final_columns = [x for x in list(X_train.columns) if x not in columns_omitted]
    print(final_columns)
    return (X_train[final_columns], Y_train)

# V CASE 3 : Feature Selection - Mutual Information
def filter_columns_feature_selection_mutualinf(X_train, Y_train, columns_considered, num_of_features):
    mi_selector = SelectKBest(mutual_info_classif, k=num_of_features) 
    df_feature = X_train[columns_considered]
    mi_selector.fit(df_feature, Y_train)
    cols = mi_selector.get_support(indices=True)
    df_selected_features = df_feature.iloc[:,cols]
    return df_selected_features.columns

def training_data_feature_selection_mutualinf(X_train, Y_train, columns_considered, num_of_features):
    columns_selected = filter_columns_feature_selection_mutualinf(X_train, Y_train, columns_considered, num_of_features)
    columns_omitted = [x for x in columns_considered if x not in columns_selected]
    final_columns = [x for x in list(X_train.columns) if x not in columns_omitted]
    print(final_columns)
    return (X_train[final_columns], Y_train)

# V CASE 4 : Feature Selection - mRMR Selection
def filter_columns_feature_selection_mrmr(X_train, Y_train, columns_considered, num_of_features):
    df_feature = X_train[columns_considered]
    selected_features = mrmr_classif(X=df_feature, y=Y_train, K=num_of_features)
    return selected_features

def training_data_feature_selection_mrmr(X_train, Y_train, columns_considered, num_of_features):
    columns_selected = filter_columns_feature_selection_mrmr(X_train, Y_train, columns_considered, num_of_features)
    columns_omitted = [x for x in columns_considered if x not in columns_selected]
    final_columns = [x for x in list(X_train.columns) if x not in columns_omitted]
    print(final_columns)
    return (X_train[final_columns], Y_train)

# X CASE 5 : Feature Selection - Sequential Forward Selection (SFS)
def filter_columns_feature_selection_sfs(X_train, Y_train, columns_considered, num_of_features):
    rf = RandomForestClassifier()
    sfs = SequentialFeatureSelector(rf, n_features_to_select=num_of_features, direction='forward')
    df_feature = X_train[columns_considered]
    sfs.fit(df_feature, Y_train)
    cols = sfs.get_support(indices=True)
    df_selected_features = df_feature.iloc[:,cols]
    return df_selected_features.columns

def training_data_feature_selection_sfs(X_train, Y_train, columns_considered, num_of_features):
    columns_selected = filter_columns_feature_selection_sfs(X_train, Y_train, columns_considered, num_of_features)
    columns_omitted = [x for x in columns_considered if x not in columns_selected]
    final_columns = [x for x in list(X_train.columns) if x not in columns_omitted]
    print(final_columns)
    return (X_train[final_columns], Y_train)

# X CASE 6 : Feature Selection - Sequential Backward Elimination (SBE)
def filter_columns_feature_selection_sbe(X_train, Y_train, columns_considered, num_of_features):
    rf = RandomForestClassifier()
    sfs = SequentialFeatureSelector(rf, n_features_to_select=num_of_features, direction='backward')
    df_feature = X_train[columns_considered]
    sfs.fit(df_feature, Y_train)
    cols = sfs.get_support(indices=True)
    df_selected_features = df_feature.iloc[:,cols]
    return df_selected_features.columns

def training_data_feature_selection_sbe(X_train, Y_train, columns_considered, num_of_features):
    columns_selected = filter_columns_feature_selection_sbe(X_train, Y_train, columns_considered, num_of_features)
    columns_omitted = [x for x in columns_considered if x not in columns_selected]
    final_columns = [x for x in list(X_train.columns) if x not in columns_omitted]
    print(final_columns)
    return (X_train[final_columns], Y_train)

# X CASE 7 : Feature Selection - Recursive Feature Elimination
def filter_columns_feature_selection_rfe(X_train, Y_train, columns_considered, num_of_features):
    estimator = LinearSVR()
    selector = RFECV(estimator, step=1, cv=num_of_features)
    df_feature = X_train[columns_considered]
    selector.fit(df_feature, Y_train)
    cols = selector.get_support(indices=True)
    df_selected_features = df_feature.iloc[:,cols]
    return df_selected_features.columns

def training_data_feature_selection_rfe(X_train, Y_train, columns_considered, num_of_features):
    columns_selected = filter_columns_feature_selection_rfe(X_train, Y_train, columns_considered, num_of_features)
    columns_omitted = [x for x in columns_considered if x not in columns_selected]
    final_columns = [x for x in list(X_train.columns) if x not in columns_omitted]
    print(final_columns)
    return (X_train[final_columns], Y_train)

# V CASE 8 : Feature Selection - Random Forest Embedded (rfembedded)
def filter_columns_feature_selection_rfembedded(X_train, Y_train, columns_considered, num_of_features):
    estimator = RandomForestClassifier()
    selector = SelectFromModel(estimator=estimator, max_features=num_of_features)
    df_feature = X_train[columns_considered]
    selector.fit(df_feature, Y_train)
    cols = selector.get_support(indices=True)
    df_selected_features = df_feature.iloc[:,cols]
    return df_selected_features.columns

def training_data_feature_selection_rfembedded(X_train, Y_train, columns_considered, num_of_features):
    columns_selected = filter_columns_feature_selection_rfembedded(X_train, Y_train, columns_considered, num_of_features)
    columns_omitted = [x for x in columns_considered if x not in columns_selected]
    final_columns = [x for x in list(X_train.columns) if x not in columns_omitted]
    print(final_columns)
    return (X_train[final_columns], Y_train)

# V CASE 9 : Feature Selection - LASSO
def filter_columns_feature_selection_lasso(X_train, Y_train, columns_considered, num_of_features):
    estimator = LogisticRegression(penalty='l2', C=0.5, solver='newton-cholesky')
    selector = SelectFromModel(estimator=estimator, max_features=num_of_features)
    df_feature = X_train[columns_considered]
    selector.fit(df_feature, Y_train)
    cols = selector.get_support(indices=True)
    df_selected_features = df_feature.iloc[:,cols]
    return df_selected_features.columns

def training_data_feature_selection_lasso(X_train, Y_train, columns_considered, num_of_features):
    columns_selected = filter_columns_feature_selection_lasso(X_train, Y_train, columns_considered, num_of_features)
    columns_omitted = [x for x in columns_considered if x not in columns_selected]
    final_columns = [x for x in list(X_train.columns) if x not in columns_omitted]
    print(final_columns)
    return (X_train[final_columns], Y_train)

# CASE 1 : Train with model XGBRegressor
def fit_and_train_with_model_xgbregressor(X_train, Y_train):
    model = XGBRegressor(objective="reg:logistic")
    model.fit(X_train, Y_train)
    return model

# CASE 2 : Train with model RandomForestRegressor
def fit_and_train_with_model_rfregressor(X_train, Y_train):
    model = RandomForestRegressor()
    model.fit(X_train, Y_train)
    return model

# CASE 3 : Train with model LogisticRegression
def fit_and_train_with_model_logregression(X_train, Y_train):
    model = LogisticRegression()
    model.fit(X_train, Y_train)
    return model

# CASE 4 : Train with model XGBClassifier
def fit_and_train_with_model_xgbclassifier(X_train, Y_train):
    model = XGBClassifier(n_estimators=50, max_depth=3, n_jobs=-3, verbosity=1, enable_categorical=True)
    model.fit(X_train, Y_train)
    return model

# CASE 5 : Train with model Catboost Classifier 
def fit_and_train_with_model_catboostclassifier(X_train, Y_train):
    model = CatBoostClassifier(n_estimators=50, max_depth=3, verbose=1)
    model.fit(X_train, Y_train)
    return model

# CASE 6 : Train with model RandomForest Classifier
def fit_and_train_with_model_rfclassifier(X_train, Y_train):
    model = RandomForestClassifier(n_estimators=50, max_depth=3, n_jobs=-3, verbose=1)
    model.fit(X_train, Y_train)
    return model

In [15]:
# FEATURE PREPROCESSING BIG DATASETS AND CREATE XGBOOST MODEL
# 1. Change all numeric columns with MinMaxScaler
scaler = preprocessing.MinMaxScaler(feature_range=(0,1))
columns_minmax_scaler = player_skills_column_included + player_attribute_column_included + \
                        ["start_x", "start_y", "distance_to_goal", "angle_to_goal", 
                        "distance_opponent", "num_opponent_closer_goal", "num_opponent_in_path"]
# Store Description for all Numeric Columns in External CSV
df_description_numeric = big_dataframe_xgoal_model[columns_minmax_scaler].describe()
filename = 'xgoal_description_numeric_data.csv'
directory_model = "data/model_xgoal/"
df_description_numeric.to_csv(directory_model + filename)
# Preprocess to minmax scaler
big_dataframe_xgoal_model[columns_minmax_scaler] = scaler.fit_transform(big_dataframe_xgoal_model[columns_minmax_scaler])

# 2. Check if data is unbalanced. If it is unbalanced, then do method to oversize the sample
print(big_dataframe_xgoal_model['result_id'].value_counts())

# 3. Change result_id label into float64 type
# big_dataframe_xgoal_model['result_id'] = big_dataframe_xgoal_model['result_id'].astype('float64')

# 4. Remove dataframe instead of having result_id (0,1) --> (fail, success)
big_dataframe_xgoal_model = big_dataframe_xgoal_model[big_dataframe_xgoal_model['result_id'].isin([0,1])]
print(big_dataframe_xgoal_model['result_id'].value_counts())

# 5. Split train data and test data from Big Datasets
all_feature_columns = columns_minmax_scaler
X_train = big_dataframe_xgoal_model[all_feature_columns]
Y_train = big_dataframe_xgoal_model["result_id"]

# Empty dataframe for saving test result
empty_test_result = pd.DataFrame(columns=COLUMNS_EXPERIMENT_RESULT, index=[0])

for case_number in sorted(list(CONFIG_EXPERIMENTS_SCENARIO_MAP.keys())):
    include_skill_opt = CONFIG_EXPERIMENTS_SCENARIO_MAP[case_number]["include_skill_opt"]
    sampling_opt = CONFIG_EXPERIMENTS_SCENARIO_MAP[case_number]["sampling_opt"]
    feature_selection_opt = CONFIG_EXPERIMENTS_SCENARIO_MAP[case_number]["feature_selection_opt"]
    algorithm_opt = CONFIG_EXPERIMENTS_SCENARIO_MAP[case_number]["algorithm_opt"]

    # 6. Filter out all player skills and attributes column if not include skill option
    if include_skill_opt == 0:
        only_featured_column = [column for column in features_column_included if column != 'result_id']
        X_train_filtered = X_train[only_featured_column]
    else:
        X_train_filtered = X_train

    # 7. Do oversampling/undersampling and feature selection at same time
    if sampling_opt == "none":
        X_resampled, Y_resampled = X_train_filtered, Y_train
    else:
        X_resampled, Y_resampled = globals()["training_data_" + sampling_opt](X_train_filtered, Y_train)
    if feature_selection_opt == "none":
        X_feature_sel, Y_feature_sel = X_resampled, Y_resampled
    else:
        if feature_selection_opt == "pearson":
            threshold = 0.5
            X_feature_sel, Y_feature_sel = globals()["training_data_feature_selection_" + feature_selection_opt](X_resampled, Y_resampled, player_skills_column_included, threshold)
        else:
            num_of_features = 10
            X_feature_sel, Y_feature_sel = globals()["training_data_feature_selection_" + feature_selection_opt](X_resampled, Y_resampled, player_skills_column_included, num_of_features)      

    # 8. Do train_test_split on training data
    X_train_split, X_test_split, y_train_split, y_test_split = train_test_split(X_feature_sel, Y_feature_sel, test_size=0.2, random_state=42)

    # 9. Train Model
    model = globals()["fit_and_train_with_model_" + algorithm_opt](X_train_split, y_train_split)

    # 10. Predict Testing Data
    y_predict = model.predict(X_test_split)

    # 11. Save test result experiment
    if (USE_EVALUATION_METRIC_CLASSIFICATION):
        rec_score = recall_score(y_test_split, y_predict)
        prec_score = precision_score(y_test_split, y_predict)
        F1_score = f1_score(y_test_split, y_predict)
        acc_score = accuracy_score(y_test_split, y_predict)
        auc_score = roc_auc_score(y_test_split, y_predict)
        mcc_score = matthews_corrcoef(y_test_split, y_predict)
        brier_score = brier_score_loss(y_test_split, y_predict)
        log_loss_score = log_loss(y_test_split, y_predict)
        balanced_acc_score = balanced_accuracy_score(y_test_split, y_predict)
    else:
        mean_squared_error_score = mean_squared_error(y_test_split, y_predict)
        root_mean_squared_error_score = mean_squared_error(y_test_split, y_predict, squared=False)
        auc_score = roc_auc_score(y_test_split, y_predict)
        brier_score = brier_score_loss(y_test_split, y_predict)
        log_loss_score = log_loss(y_test_split, y_predict)
        mean_absolute_error_score = mean_absolute_error(y_test_split, y_predict)
        r_squared_score = r2_score(y_test_split, y_predict)
        mean_absolute_percentage_error_score = mean_absolute_percentage_error(y_test_split, y_predict)

    maps_new_row = {}
    if USE_EVALUATION_METRIC_CLASSIFICATION:
        eval_metrics_column = COLUMNS_EVALUATION_METRIC_CLASSIFICATION
    else:
        eval_metrics_column = COLUMNS_EVALUATION_METRIC_REGRESSION
    for column in COLUMNS_EXPERIMENT_RESULT:
        if column not in eval_metrics_column:
            if column == "case_number":
                maps_new_row["case_number"] = case_number
            elif column in COLUMNS_SCENARIO_NAME:
                maps_new_row[column] = globals()[column]
        else:
            maps_new_row[column] = globals()[column]     
    new_row = pd.DataFrame(maps_new_row, index=[0])
    empty_test_result = pd.concat([new_row, empty_test_result.loc[:]]).reset_index(drop=True)

    # 12. Save model to external file
    filename = f'xgoal_model_case_{case_number}.sav'
    directory_model = "data/model_xgoal/"
    pickle.dump(model, open(directory_model + filename, 'wb'))

# 13. Save test result experiment to external file
filename = 'xgoal_test_model_experiment_result.csv'
directory_model = "data/model_xgoal/"
empty_test_result.to_csv(directory_model + filename)


0    1954
1     294
Name: result_id, dtype: int64
0    1954
1     294
Name: result_id, dtype: int64
Learning rate set to 0.20643
0:	learn: 0.5947560	total: 144ms	remaining: 7.05s
1:	learn: 0.5278472	total: 144ms	remaining: 3.47s
2:	learn: 0.4763923	total: 145ms	remaining: 2.27s
3:	learn: 0.4403506	total: 146ms	remaining: 1.67s
4:	learn: 0.4147960	total: 146ms	remaining: 1.31s
5:	learn: 0.3949336	total: 147ms	remaining: 1.07s
6:	learn: 0.3779389	total: 147ms	remaining: 904ms
7:	learn: 0.3656392	total: 148ms	remaining: 775ms
8:	learn: 0.3579662	total: 148ms	remaining: 675ms
9:	learn: 0.3500678	total: 149ms	remaining: 594ms
10:	learn: 0.3457770	total: 149ms	remaining: 528ms
11:	learn: 0.3398641	total: 149ms	remaining: 473ms
12:	learn: 0.3340561	total: 150ms	remaining: 427ms
13:	learn: 0.3304816	total: 150ms	remaining: 387ms
14:	learn: 0.3273719	total: 151ms	remaining: 352ms
15:	learn: 0.3253392	total: 151ms	remaining: 321ms
16:	learn: 0.3241314	total: 152ms	remaining: 294ms
17:	learn: 0.3

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


0:	learn: 0.6383776	total: 916us	remaining: 44.9ms
1:	learn: 0.6058333	total: 1.77ms	remaining: 42.4ms
2:	learn: 0.5809082	total: 2.4ms	remaining: 37.7ms
3:	learn: 0.5653311	total: 3.19ms	remaining: 36.7ms
4:	learn: 0.5524160	total: 3.88ms	remaining: 34.9ms
5:	learn: 0.5443999	total: 4.61ms	remaining: 33.8ms
6:	learn: 0.5373058	total: 5.3ms	remaining: 32.6ms
7:	learn: 0.5338378	total: 5.97ms	remaining: 31.4ms
8:	learn: 0.5303751	total: 6.78ms	remaining: 30.9ms
9:	learn: 0.5271613	total: 7.53ms	remaining: 30.1ms
10:	learn: 0.5227470	total: 8.15ms	remaining: 28.9ms
11:	learn: 0.5199874	total: 8.82ms	remaining: 27.9ms
12:	learn: 0.5162835	total: 9.46ms	remaining: 26.9ms
13:	learn: 0.5131808	total: 10.1ms	remaining: 26.1ms
14:	learn: 0.5108107	total: 10.8ms	remaining: 25.1ms
15:	learn: 0.5094464	total: 11.4ms	remaining: 24.3ms
16:	learn: 0.5038919	total: 12.2ms	remaining: 23.6ms
17:	learn: 0.5018659	total: 13.2ms	remaining: 23.5ms
18:	learn: 0.4997628	total: 14ms	remaining: 22.8ms
19:	lear

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.


Learning rate set to 0.116403
0:	learn: 0.6674741	total: 701us	remaining: 34.4ms
1:	learn: 0.6492751	total: 2.32ms	remaining: 55.7ms
2:	learn: 0.6296788	total: 2.81ms	remaining: 44ms
3:	learn: 0.6167164	total: 3.41ms	remaining: 39.2ms
4:	learn: 0.6065532	total: 3.77ms	remaining: 33.9ms
5:	learn: 0.5976321	total: 4.21ms	remaining: 30.9ms
6:	learn: 0.5908433	total: 4.61ms	remaining: 28.3ms
7:	learn: 0.5836593	total: 5.08ms	remaining: 26.7ms
8:	learn: 0.5757832	total: 5.44ms	remaining: 24.8ms
9:	learn: 0.5673072	total: 5.79ms	remaining: 23.1ms
10:	learn: 0.5624796	total: 6.2ms	remaining: 22ms
11:	learn: 0.5582537	total: 6.58ms	remaining: 20.8ms
12:	learn: 0.5536090	total: 6.93ms	remaining: 19.7ms
13:	learn: 0.5493503	total: 7.28ms	remaining: 18.7ms
14:	learn: 0.5439279	total: 7.73ms	remaining: 18ms
15:	learn: 0.5421960	total: 8.07ms	remaining: 17.1ms
16:	learn: 0.5383525	total: 8.43ms	remaining: 16.4ms
17:	learn: 0.5357552	total: 8.76ms	remaining: 15.6ms
18:	learn: 0.5332217	total: 9.1ms	

[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.


Learning rate set to 0.26142
0:	learn: 0.6406252	total: 946us	remaining: 46.4ms
1:	learn: 0.6037448	total: 1.81ms	remaining: 43.5ms
2:	learn: 0.5759297	total: 2.5ms	remaining: 39.1ms
3:	learn: 0.5615933	total: 3.32ms	remaining: 38.1ms
4:	learn: 0.5508680	total: 4.32ms	remaining: 38.9ms
5:	learn: 0.5424847	total: 5.08ms	remaining: 37.3ms
6:	learn: 0.5363268	total: 6.47ms	remaining: 39.7ms
7:	learn: 0.5311328	total: 7.25ms	remaining: 38.1ms
8:	learn: 0.5238716	total: 8ms	remaining: 36.4ms
9:	learn: 0.5166819	total: 8.8ms	remaining: 35.2ms
10:	learn: 0.5109303	total: 9.51ms	remaining: 33.7ms
11:	learn: 0.5070949	total: 10.3ms	remaining: 32.6ms
12:	learn: 0.5033186	total: 11ms	remaining: 31.4ms
13:	learn: 0.4994411	total: 13.4ms	remaining: 34.3ms
14:	learn: 0.4971263	total: 14.3ms	remaining: 33.3ms
15:	learn: 0.4936580	total: 14.9ms	remaining: 31.8ms
16:	learn: 0.4910501	total: 16.1ms	remaining: 31.2ms
17:	learn: 0.4886164	total: 16.9ms	remaining: 30ms
18:	learn: 0.4867730	total: 17.6ms	re

[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.20643
0:	learn: 0.5899069	total: 2.31ms	remaining: 113ms
1:	learn: 0.5224069	total: 2.99ms	remaining: 71.9ms
2:	learn: 0.4737403	total: 3.55ms	remaining: 55.6ms
3:	learn: 0.4385986	total: 4.19ms	remaining: 48.2ms
4:	learn: 0.4165458	total: 4.77ms	remaining: 42.9ms
5:	learn: 0.3978155	total: 5.39ms	remaining: 39.5ms
6:	learn: 0.3828627	total: 6ms	remaining: 36.8ms
7:	learn: 0.3711179	total: 6.53ms	remaining: 34.3ms
8:	learn: 0.3584445	total: 7ms	remaining: 31.9ms
9:	learn: 0.3514999	total: 7.47ms	remaining: 29.9ms
10:	learn: 0.3462628	total: 8.03ms	remaining: 28.5ms
11:	learn: 0.3406782	total: 9.14ms	remaining: 29ms
12:	learn: 0.3388653	total: 10ms	remaining: 28.5ms
13:	learn: 0.3344032	total: 10.9ms	remaining: 28ms
14:	learn: 0.3333608	total: 11.5ms	remaining: 26.8ms
15:	learn: 0.3304350	total: 12ms

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['curve', 'finishing', 'freekick_accuracy', 'interceptions', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['curve', 'finishing', 'freekick_accuracy', 'interceptions', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.20643
0:	learn: 0.5439590	total: 1.5ms	remaining: 73.3ms
1:	learn: 0.4542717	total: 2.98ms	remaining: 71.5ms
2:	learn: 0.4085214	total: 4.29ms	remaining: 67.2ms
3:	learn: 0.3889328	total: 6.53ms	remaining: 75.1ms
4:	learn: 0.3672688	total: 8.15ms	remaining: 73.3ms
5:	learn: 0.3605182	total: 9.72ms	remaining: 71.3ms
6:	learn: 0.3497821	total: 11ms	

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['acceleration', 'aggression', 'agility', 'finishing', 'jumping', 'long_passing', 'long_shots', 'penalties', 'reactions', 'sliding_tackle', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['agility', 'ball_control', 'dribbling', 'jumping', 'marking', 'penalties', 'reactions', 'standing_tackle', 'strength', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.20643
0:	learn: 0.5440341	total: 1.82ms	remaining: 89.3ms
1:	learn: 0.4548183	total: 3.26ms	remaining: 78.2ms
2:	learn: 0.4088315	total: 4.53ms	remaining: 71ms
3:	learn: 0.3883963	total: 5.69ms	remaining: 65.5ms
4:	learn: 0.3666271	total: 6.9ms	remaining: 62.1ms
5:	learn: 0.3599648	total: 8.24ms	remaining: 60.4ms
6:	learn: 0.3493923	total: 9.42ms	remaining: 57.9ms
7:	lear

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished
100%|██████████| 10/10 [00:00<00:00, 63.01it/s]


['ball_control', 'finishing', 'interceptions', 'jumping', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']


100%|██████████| 10/10 [00:00<00:00, 55.96it/s]


['ball_control', 'finishing', 'interceptions', 'jumping', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.20643
0:	learn: 0.5419835	total: 1.72ms	remaining: 84.1ms
1:	learn: 0.4534164	total: 3.28ms	remaining: 78.6ms
2:	learn: 0.4078851	total: 4.4ms	remaining: 68.9ms
3:	learn: 0.3882000	total: 5.54ms	remaining: 63.7ms
4:	learn: 0.3666735	total: 6.63ms	remaining: 59.6ms
5:	learn: 0.3600553	total: 7.71ms	remaining: 56.6ms
6:	learn: 0.3494004	total: 8.77ms	remaining: 53.9ms
7:	learn: 0.3438232	total: 9.83ms	remaining: 51.6ms
8:	learn: 0.3391940	total: 11.1ms	remaining: 50.8ms
9:	learn: 0.3337924	total: 12.4ms	remaining: 49.4ms
10:	learn: 0.3314383	total: 13.6ms	remaining: 48.1ms
11:	learn: 0.3276322	total: 14.7ms	remaining: 46.7ms
12:	learn: 0.3229252	total: 15.9ms	

100%|██████████| 10/10 [00:00<00:00, 61.71it/s]
[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['ball_control', 'finishing', 'interceptions', 'jumping', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['finishing', 'heading_accuracy', 'long_shots', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'strength', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['acceleration', 'curve', 'freekick_accuracy', 'heading_accuracy', 'long_shots', 'marking', 'penalties', 'sliding_tackle', 'strength', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.20643
0:	learn: 0.5428853	total: 1.31ms	r

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


44:	learn: 0.2780298	total: 58.4ms	remaining: 6.49ms
45:	learn: 0.2772818	total: 59.7ms	remaining: 5.19ms
46:	learn: 0.2769728	total: 61ms	remaining: 3.9ms
47:	learn: 0.2757916	total: 62.3ms	remaining: 2.59ms
48:	learn: 0.2747385	total: 63.6ms	remaining: 1.3ms
49:	learn: 0.2733888	total: 64.8ms	remaining: 0us
['acceleration', 'aggression', 'agility', 'heading_accuracy', 'jumping', 'long_shots', 'marking', 'penalties', 'short_passing', 'vision', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']


[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.26142
0:	learn: 0.6378525	total: 791us	remaining: 38.8ms
1:	learn: 0.6054523	total: 2.06ms	remaining: 49.4ms
2:	learn: 0.5842650	total: 2.82ms	remaining: 44.1ms
3:	learn: 0.5699416	total: 3.43ms	remaining: 39.4ms
4:	learn: 0.5515581	total: 4.23ms	remaining: 38.1ms
5:	learn: 0.5436632	total: 4.93ms	remaining: 36.2ms
6:	learn: 0.5389636	total: 5.65ms	remaining: 34.7ms
7:	learn: 0.5337741	total: 6.45ms	remaining: 33.9ms
8:	learn: 0.5289772	total: 7.1ms	remaining: 32.3ms
9:	learn: 0.5258201	total: 7.77ms	remaining: 31.1ms
10:	learn: 0.5211909	total: 8.4ms	remaining: 29.8ms
11:	learn: 0.5183311	total: 9.18ms	remaining: 29.1ms
12:	learn: 0.5146703	total: 9.85ms	remaining: 28ms
13:	learn: 0.5100063	total: 10.4ms	remaining: 26.8ms
14:	learn: 0.5075991	total: 11.1ms	remaining: 25.8ms
15:	learn: 0.5058930	tot

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['aggression', 'finishing', 'interceptions', 'jumping', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.26142
0:	learn: 0.6274589	total: 1.58ms	remaining: 77.7ms
1:	learn: 0.5922234	total: 3.16ms	remaining: 75.8ms
2:	learn: 0.5763836	total: 5.2ms	remaining: 81.5ms
3:	learn: 0.5618192	total: 6.91ms	remaining: 79.5ms
4:	learn: 0.5458981	total: 8.32ms	remaining: 74.9ms
5:	learn: 0.5390062	total: 10.1ms	remaining: 73.7ms
6:	learn: 0.5301040	total: 11.5ms	remaining: 70.5ms
7:	learn: 0.5205494	total: 12.7ms	remaining: 66.9ms
8:	learn: 0.5148123	total: 14.1ms	remaining: 64.3ms
9:	learn: 0.5110214	total: 15.4ms	remaining: 61.7ms
10:	learn: 0.5062191	total: 16.7ms	remaining: 59.1ms
11:	learn: 0.5019661	total: 18ms	remaining: 57ms
12:	learn: 0.4995184	total: 19.6ms	remain

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['interceptions', 'jumping', 'long_shots', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'vision', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['agility', 'balance', 'finishing', 'interceptions', 'marking', 'penalties', 'sliding_tackle', 'standing_tackle', 'vision', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.26142
0:	learn: 0.6274589	total: 1.71ms	remaining: 83.7ms
1:	learn: 0.5922234	total: 3.44ms	remaining: 82.4ms
2:	learn: 0.5723510	total: 4.76ms	remaining: 74.5ms
3:	learn: 0.5578714	total: 5.96ms	remaining: 68.5ms
4:	learn: 0.5463427	total: 7.22ms	remaining: 64.9ms
5:	learn: 0.5336380	total: 8.35ms	remaining: 61.2ms
6:	learn: 0.5241308	total: 9.93ms	remaining: 61ms
7:

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['acceleration', 'aggression', 'agility', 'dribbling', 'interceptions', 'long_shots', 'marking', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']


100%|██████████| 10/10 [00:00<00:00, 68.00it/s]


['composure', 'finishing', 'interceptions', 'jumping', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']


100%|██████████| 10/10 [00:00<00:00, 53.51it/s]


['composure', 'finishing', 'interceptions', 'jumping', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.26142
0:	learn: 0.6274589	total: 1.37ms	remaining: 67.4ms
1:	learn: 0.5922234	total: 2.82ms	remaining: 67.7ms
2:	learn: 0.5763836	total: 4.02ms	remaining: 63ms
3:	learn: 0.5618192	total: 5.22ms	remaining: 60ms
4:	learn: 0.5458981	total: 6.25ms	remaining: 56.2ms
5:	learn: 0.5377551	total: 7.51ms	remaining: 55.1ms
6:	learn: 0.5288562	total: 8.93ms	remaining: 54.8ms
7:	learn: 0.5251052	total: 10.3ms	remaining: 54.1ms
8:	learn: 0.5143999	total: 11.6ms	remaining: 52.7ms
9:	learn: 0.5123468	total: 12.9ms	remaining: 51.5ms
10:	learn: 0.5081910	total: 14.2ms	remaining: 50.3ms
11:	learn: 0.5036066	total: 15.4ms	remaining: 48.9ms
12:	learn: 0.4999111	total: 16.8ms	remain

100%|██████████| 10/10 [00:00<00:00, 61.95it/s]
[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['composure', 'finishing', 'interceptions', 'jumping', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['acceleration', 'heading_accuracy', 'interceptions', 'jumping', 'marking', 'penalties', 'shot_power', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['acceleration', 'heading_accuracy', 'interceptions', 'jumping', 'marking', 'penalties', 'shot_power', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.26142
0:	learn: 0.6274589	total: 1.

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


12:	learn: 0.4910298	total: 17.5ms	remaining: 49.7ms
13:	learn: 0.4859899	total: 18.8ms	remaining: 48.3ms
14:	learn: 0.4844163	total: 20ms	remaining: 46.7ms
15:	learn: 0.4823085	total: 21.3ms	remaining: 45.3ms
16:	learn: 0.4798977	total: 22.7ms	remaining: 44.1ms
17:	learn: 0.4760986	total: 24ms	remaining: 42.7ms
18:	learn: 0.4724404	total: 25.4ms	remaining: 41.5ms
19:	learn: 0.4708103	total: 26.7ms	remaining: 40.1ms
20:	learn: 0.4664293	total: 28.1ms	remaining: 38.8ms
21:	learn: 0.4640074	total: 29.4ms	remaining: 37.4ms
22:	learn: 0.4614090	total: 30.6ms	remaining: 36ms
23:	learn: 0.4578107	total: 31.9ms	remaining: 34.6ms
24:	learn: 0.4546223	total: 33.2ms	remaining: 33.2ms
25:	learn: 0.4520767	total: 34.6ms	remaining: 31.9ms
26:	learn: 0.4484255	total: 36ms	remaining: 30.7ms
27:	learn: 0.4443543	total: 37.3ms	remaining: 29.3ms
28:	learn: 0.4425001	total: 38.9ms	remaining: 28.2ms
29:	learn: 0.4393844	total: 40.4ms	remaining: 26.9ms
30:	learn: 0.4350563	total: 41.8ms	remaining: 25.6ms
3

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.116403
0:	learn: 0.6671976	total: 427us	remaining: 21ms
1:	learn: 0.6457298	total: 805us	remaining: 19.3ms
2:	learn: 0.6265955	total: 1.25ms	remaining: 19.6ms
3:	learn: 0.6109086	total: 1.61ms	remaining: 18.6ms
4:	learn: 0.6000697	total: 1.94ms	remaining: 17.5ms
5:	learn: 0.5893610	total: 2.33ms	remaining: 17.1ms
6:	learn: 0.5821532	total: 2.67ms	remaining: 16.4ms
7:	learn: 0.5743187	total: 3.04ms	remaining: 16ms
8:	learn: 0.5681819	total: 3.4ms	remaining: 15.5ms
9:	learn: 0.5625494	total: 3.75ms	remaining: 15ms
10:	learn: 0.5577186	total: 4.09ms	remaining: 14.5ms
11:	learn: 0.5531596	total: 4.57ms	remaining: 14.5ms
12:	learn: 0.5499037	total: 5ms	remaining: 14.2ms
13:	learn: 0.5448464	total: 5.39ms	remaining: 13.9ms
14:	learn: 0.5413510	total: 5.82ms	remaining: 13.6ms
15:	learn: 0.5376695	total: 6.

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['finishing', 'interceptions', 'marking', 'penalties', 'positioning', 'reactions', 'shot_power', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.116403
0:	learn: 0.6645827	total: 1.23ms	remaining: 60.4ms
1:	learn: 0.6402265	total: 2.42ms	remaining: 58.1ms
2:	learn: 0.6180704	total: 3.54ms	remaining: 55.4ms
3:	learn: 0.6008626	total: 4.56ms	remaining: 52.5ms
4:	learn: 0.5868205	total: 5.51ms	remaining: 49.6ms
5:	learn: 0.5696815	total: 6.39ms	remaining: 46.8ms
6:	learn: 0.5588355	total: 7.3ms	remaining: 44.9ms
7:	learn: 0.5511524	total: 8.19ms	remaining: 43ms
8:	learn: 0.5428800	total: 9.07ms	remaining: 41.3ms
9:	learn: 0.5384734	total: 9.96ms	remaining: 39.8ms
10:	learn: 0.5326230	total: 10.8ms	remaining: 38.4ms
11:	learn: 0.5256483	total: 11.7ms	remaining: 37ms
12:	learn: 0.5194810	total: 12.6ms	rem

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['ball_control', 'composure', 'curve', 'finishing', 'freekick_accuracy', 'jumping', 'long_passing', 'marking', 'shot_power', 'standing_tackle', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['acceleration', 'balance', 'ball_control', 'composure', 'dribbling', 'freekick_accuracy', 'marking', 'sliding_tackle', 'sprint_speed', 'standing_tackle', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.116403
0:	learn: 0.6631139	total: 1.18ms	remaining: 57.8ms
1:	learn: 0.6373873	total: 2.17ms	remaining: 52.1ms
2:	learn: 0.6137775	total: 3.15ms	remaining: 49.4ms
3:	learn: 0.5950589	total: 4.16ms	remaining: 47.9ms
4:	learn: 0.5838787	total: 5.29ms	remaining: 47.6ms
5:	learn: 0.5741943	total: 6.53ms	remaining: 47.9ms
6:	learn: 0.5630263	total: 

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished
100%|██████████| 10/10 [00:00<00:00, 65.41it/s]


['finishing', 'interceptions', 'jumping', 'marking', 'penalties', 'positioning', 'reactions', 'sliding_tackle', 'standing_tackle', 'vision', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']


100%|██████████| 10/10 [00:00<00:00, 55.61it/s]


['finishing', 'interceptions', 'jumping', 'marking', 'penalties', 'positioning', 'reactions', 'sliding_tackle', 'standing_tackle', 'vision', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.116403
0:	learn: 0.6638227	total: 1.11ms	remaining: 54.4ms
1:	learn: 0.6383987	total: 2.28ms	remaining: 54.7ms
2:	learn: 0.6163348	total: 3.11ms	remaining: 48.7ms
3:	learn: 0.5990990	total: 3.9ms	remaining: 44.9ms
4:	learn: 0.5859191	total: 4.71ms	remaining: 42.4ms
5:	learn: 0.5757831	total: 5.5ms	remaining: 40.3ms
6:	learn: 0.5624652	total: 6.47ms	remaining: 39.7ms
7:	learn: 0.5548559	total: 7.27ms	remaining: 38.2ms
8:	learn: 0.5451987	total: 8.05ms	remaining: 36.7ms
9:	learn: 0.5404125	total: 8.91ms	remaining: 35.7ms
10:	learn: 0.5361024	total: 9.74ms	remaining: 34.5ms
11:	learn: 0.5283123	total: 10.6ms	remaining: 33.4ms
12:	learn: 0.5192293	total: 11.3ms	rema

100%|██████████| 10/10 [00:00<00:00, 60.93it/s]
[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['finishing', 'interceptions', 'jumping', 'marking', 'penalties', 'positioning', 'reactions', 'sliding_tackle', 'standing_tackle', 'vision', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['curve', 'heading_accuracy', 'interceptions', 'jumping', 'marking', 'penalties', 'positioning', 'stamina', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['acceleration', 'heading_accuracy', 'interceptions', 'jumping', 'marking', 'penalties', 'sprint_speed', 'stamina', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.116403
0:	learn: 0.6675585	total: 1ms	remaining: 49ms


[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


42:	learn: 0.4526093	total: 37.9ms	remaining: 6.16ms
43:	learn: 0.4505582	total: 38.7ms	remaining: 5.28ms
44:	learn: 0.4481900	total: 39.8ms	remaining: 4.42ms
45:	learn: 0.4463933	total: 40.7ms	remaining: 3.54ms
46:	learn: 0.4432159	total: 41.6ms	remaining: 2.65ms
47:	learn: 0.4423605	total: 42.5ms	remaining: 1.77ms
48:	learn: 0.4413500	total: 43.4ms	remaining: 884us
49:	learn: 0.4409025	total: 44.2ms	remaining: 0us
['finishing', 'interceptions', 'jumping', 'long_shots', 'marking', 'penalties', 'positioning', 'reactions', 'stamina', 'short_passing', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']


[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.26142
0:	learn: 0.6269810	total: 877us	remaining: 43ms
1:	learn: 0.5906731	total: 1.58ms	remaining: 37.8ms
2:	learn: 0.5652399	total: 2.37ms	remaining: 37.1ms
3:	learn: 0.5434760	total: 3.17ms	remaining: 36.5ms
4:	learn: 0.5319899	total: 3.79ms	remaining: 34.1ms
5:	learn: 0.5231162	total: 4.49ms	remaining: 33ms
6:	learn: 0.5161394	total: 5.17ms	remaining: 31.8ms
7:	learn: 0.5109620	total: 5.84ms	remaining: 30.7ms
8:	learn: 0.5034046	total: 6.49ms	remaining: 29.6ms
9:	learn: 0.4998919	total: 7.21ms	remaining: 28.8ms
10:	learn: 0.4941675	total: 8.01ms	remaining: 28.4ms
11:	learn: 0.4909846	total: 8.89ms	remaining: 28.2ms
12:	learn: 0.487

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['finishing', 'freekick_accuracy', 'interceptions', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'vision', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['curve', 'finishing', 'freekick_accuracy', 'interceptions', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.26142
0:	learn: 0.6162540	total: 1.84ms	remaining: 90.4ms
1:	learn: 0.5753259	total: 3.14ms	remaining: 75.3ms
2:	learn: 0.5483029	total: 4.54ms	remaining: 71.1ms
3:	learn: 0.5289215	total: 6.42ms	remaining: 73.8ms
4:	learn: 0.5143234	total: 8.42ms	remaining: 75.8ms
5:	learn: 0.5062488	total: 10.2ms	remaining: 74.8ms
6:	learn: 0.4976086	total: 11.

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['acceleration', 'aggression', 'balance', 'composure', 'heading_accuracy', 'jumping', 'penalties', 'reactions', 'shot_power', 'sliding_tackle', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['acceleration', 'ball_control', 'composure', 'heading_accuracy', 'interceptions', 'jumping', 'long_shots', 'marking', 'reactions', 'short_passing', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.26142
0:	learn: 0.6283959	total: 1.76ms	remaining: 86.3ms
1:	learn: 0.5897613	total: 2.94ms	remaining: 70.7ms
2:	learn: 0.5632894	total: 4.21ms	remaining: 66ms
3:	learn: 0.5390462	total: 5.62ms	remaining: 64.6ms
4:	learn: 0.5248493	total: 6.71ms	remaining: 60.4ms
5:	learn: 0.5139278	total: 7.89ms	remaining: 57.9ms
6:	learn: 0.4969185	total: 9.13ms	re

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['acceleration', 'agility', 'ball_control', 'composure', 'heading_accuracy', 'jumping', 'penalties', 'reactions', 'stamina', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']


100%|██████████| 10/10 [00:00<00:00, 60.20it/s]


['heading_accuracy', 'interceptions', 'jumping', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'vision', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']


100%|██████████| 10/10 [00:00<00:00, 52.61it/s]


['composure', 'finishing', 'interceptions', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'strength', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.26142
0:	learn: 0.6136643	total: 2.68ms	remaining: 131ms
1:	learn: 0.5723137	total: 4.22ms	remaining: 101ms
2:	learn: 0.5437947	total: 5.94ms	remaining: 93.1ms
3:	learn: 0.5287441	total: 7.66ms	remaining: 88ms
4:	learn: 0.5158685	total: 9.01ms	remaining: 81.1ms
5:	learn: 0.5006908	total: 10.5ms	remaining: 77ms
6:	learn: 0.4918284	total: 12.2ms	remaining: 74.7ms
7:	learn: 0.4844125	total: 13.9ms	remaining: 73.2ms
8:	learn: 0.4798655	total: 15.7ms	remaining: 71.3ms
9:	learn: 0.4745881	total: 17.1ms	remaining: 68.3ms
10:	learn: 0.4710474	total: 18.7ms	remaining: 66.3ms
11:	learn: 0.4682543	total: 20.1ms	remaining: 63.6ms
12:	learn: 0.4635531	total: 21.6ms	remaini

100%|██████████| 10/10 [00:00<00:00, 56.74it/s]
[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['dribbling', 'heading_accuracy', 'interceptions', 'marking', 'penalties', 'positioning', 'sliding_tackle', 'standing_tackle', 'vision', 'volleys', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['acceleration', 'freekick_accuracy', 'interceptions', 'jumping', 'long_shots', 'marking', 'sliding_tackle', 'sprint_speed', 'stamina', 'standing_tackle', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
['acceleration', 'aggression', 'jumping', 'long_shots', 'marking', 'penalties', 'sliding_tackle', 'sprint_speed', 'standing_tackle', 'strength', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.26142
0:	learn: 0.6230419	total

[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished


['acceleration', 'agility', 'dribbling', 'jumping', 'long_shots', 'marking', 'penalties', 'reactions', 'short_passing', 'strength', 'height_cm', 'weight_kgs', 'age', 'start_x', 'start_y', 'distance_to_goal', 'angle_to_goal', 'distance_opponent', 'num_opponent_closer_goal', 'num_opponent_in_path']
Learning rate set to 0.26142
0:	learn: 0.6194358	total: 2.17ms	remaining: 106ms
1:	learn: 0.5767946	total: 3.76ms	remaining: 90.3ms
2:	learn: 0.5494053	total: 5.17ms	remaining: 80.9ms
3:	learn: 0.5333863	total: 6.53ms	remaining: 75.1ms
4:	learn: 0.5169783	total: 8.12ms	remaining: 73ms
5:	learn: 0.5040369	total: 9.6ms	remaining: 70.4ms
6:	learn: 0.4957301	total: 11ms	remaining: 67.9ms
7:	learn: 0.4891660	total: 12.4ms	remaining: 64.9ms
8:	learn: 0.4820617	total: 13.6ms	remaining: 61.8ms
9:	learn: 0.4772486	total: 15.1ms	remaining: 60.3ms
10:	learn: 0.4734555	total: 16.6ms	remaining: 58.9ms
11:	learn: 0.4700305	total: 18.1ms	remaining: 57.5ms
12:	learn: 0.4642258	total: 19.6ms	remaining: 55.8ms


[Parallel(n_jobs=-3)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=-3)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=-3)]: Done  50 out of  50 | elapsed:    0.0s finished
[Parallel(n_jobs=10)]: Using backend ThreadingBackend with 10 concurrent workers.
[Parallel(n_jobs=10)]: Done  30 tasks      | elapsed:    0.0s
[Parallel(n_jobs=10)]: Done  50 out of  50 | elapsed:    0.0s finished
