# Synchronize data to Google Drive
This notebook guides you through copying the data from the Amazon S3 bucket to a folder in your Google Drive account.

In [0]:
%load_ext autoreload
%autoreload 2

# Import standard modules
import os
from getpass import getpass

# Import boto3 module
import boto3

# Import Google Colab function
from google.colab import drive

In [0]:
# Access your Google Drive account: mount it at `mount_point`, which the
# later cells use as the root of the Drive path
mount_point = '/content/gdrive'
drive.mount(mount_point)

In [0]:
# Build the target directory on Google Drive: <mount_point>/My Drive/Wyscout
drive_folder = 'My Drive'  # folder directly under the mount point
directory = 'Wyscout'  # folder that receives the downloaded files
path = os.path.join(mount_point, drive_folder, directory)

In [0]:
# Provide credentials for Amazon S3.
# Each key is taken from the environment variable of the same name when it is
# set; otherwise it is requested through a hidden prompt. This keeps the
# secrets out of the notebook source, which is saved and possibly shared.
AWS_ACCESS_KEY_ID = os.environ.get('AWS_ACCESS_KEY_ID') or getpass('AWS Access Key ID: ')
AWS_SECRET_ACCESS_KEY = os.environ.get('AWS_SECRET_ACCESS_KEY') or getpass('AWS Secret Access Key: ')

In [0]:
# Open a boto3 session with the credentials provided above, then obtain a
# handle on the S3 bucket that holds the data
session = boto3.Session(aws_access_key_id=AWS_ACCESS_KEY_ID, aws_secret_access_key=AWS_SECRET_ACCESS_KEY)
s3 = session.resource('s3')
bucket = s3.Bucket('ssda-master-class-sports-analytics')

In [0]:
# Copy the data for selected seasons from the S3 bucket to Google Drive.
# The files on Drive mirror the object keys in the bucket:
#   competitions.h5, seasons.h5 and season-<id>/<file_name> for every season.
# season_ids = [10992, 181334, 185611]  # Eredivisie 2016/2017 - 2018/2019
# season_ids = [10883, 181150, 185618]  # Premier League 2016/2017 - 2018/2019
season_ids = [10883, 10992, 181150, 181334, 185611, 185618]  # Eredivisie 2016/2017 - 2018/2019 + Premier League 2016/2017 - 2018/2019

file_names = ['actions.h5', 'matches.h5', 'players.h5', 'teams.h5']

# Create directories with os.makedirs instead of a shell command, so the
# Drive path (which contains a space) never needs shell quoting
os.makedirs(path, exist_ok=True)
for file_name in ['competitions.h5', 'seasons.h5']:
    bucket.download_file(file_name, os.path.join(path, file_name))

for season_id in season_ids:
    season_key = f'season-{season_id}'
    os.makedirs(os.path.join(path, season_key), exist_ok=True)
    for file_name in file_names:
        # S3 object keys always use '/', independent of the local path separator
        bucket.download_file(f'{season_key}/{file_name}', os.path.join(path, season_key, file_name))

In [0]:
# Remount Google Drive at the same mount point.
# NOTE(review): presumably this is meant to make sure the downloaded files are
# written through to Drive — confirm; drive.flush_and_unmount() may be the
# more direct way to do that.
drive.mount(mount_point, force_remount=True)