In [1]:
import pandas as pd
import numpy as np
import os
import zipfile
import shutil
import filecmp

In [4]:
def extract_zip_files(main_zipfile, destination_folder):
    """
    Extract a zip archive and then every zip archive found directly inside it.

    The main archive is unpacked into ``destination_folder``. Every ``.zip`` file
    that afterwards sits at the top level of ``destination_folder`` is unpacked
    into a sibling directory named after the archive (extension stripped).
    Archives located deeper in the extracted tree are left untouched.

    Parameters:
    main_zipfile (str): The path to the main (root) zipfile.
    destination_folder (str): The path to where extracted files should be placed.

    Raises:
    FileNotFoundError: If ``main_zipfile`` does not exist.
    zipfile.BadZipFile: If the main archive or one of the nested ``.zip`` files
        is not a valid zip archive.
    """
    # exist_ok=True replaces the separate exists() check, which could race with
    # another process creating the directory in between.
    os.makedirs(destination_folder, exist_ok=True)

    # Extract the main zip file
    with zipfile.ZipFile(main_zipfile, 'r') as main_zip:
        main_zip.extractall(destination_folder)

    # Collect the zip files at the top level of the destination. The extension
    # is compared case-insensitively so "DAY.ZIP" is not silently skipped, and
    # directories whose name merely ends in ".zip" are ignored.
    nested_zip_files = [
        os.path.join(destination_folder, filename)
        for filename in sorted(os.listdir(destination_folder))
        if filename.lower().endswith('.zip')
        and os.path.isfile(os.path.join(destination_folder, filename))
    ]

    for nested_zip in nested_zip_files:
        # Create a directory with the same name as the zip file (without extension)
        archive_stem = os.path.splitext(os.path.basename(nested_zip))[0]
        nested_destination = os.path.join(destination_folder, archive_stem)
        os.makedirs(nested_destination, exist_ok=True)

        # Extract the nested zipfile into its own directory
        with zipfile.ZipFile(nested_zip, 'r') as nested_zipfile:
            nested_zipfile.extractall(nested_destination)

# Unpack the monthly archive, then each archive it contains, under raw_data/
extract_zip_files(
    main_zipfile='../Raw_Data/202405.zip',
    destination_folder='../Raw_Data/raw_data',
)

In [7]:
def collect_files(source_root, destination_folder, target_subdir, target_filename_prefix):
    """
    Move every matching file found under ``source_root`` into one flat directory.

    The tree below ``source_root`` is walked. In each directory whose name equals
    ``target_subdir``, files whose name starts with ``target_filename_prefix`` are
    moved (not copied) into ``destination_folder``. When a file with the same
    name is already present in the destination:

    * identical content  -> the source is a true duplicate and is deleted;
    * different content  -> the source is left where it is and a message is
      printed, so a mere name collision never destroys data;
    * same physical file -> nothing is done (the destination lies inside the
      walked tree).

    Parameters:
    source_root (str): Directory that has all the 31 days data.
    destination_folder (str): Directory to collect the files from the same category into.
    target_subdir (str): The directory where we can find desired files.
    target_filename_prefix (str): Prefix of the files to collect.
    """
    # Make the destination directory if it doesn't exist
    os.makedirs(destination_folder, exist_ok=True)

    # Explore the directory structure
    for root, _, files in os.walk(source_root):
        # Only directories named exactly like the target hold the wanted files
        if os.path.basename(root) != target_subdir:
            continue

        for file in files:
            if not file.startswith(target_filename_prefix):
                continue

            source_file_path = os.path.join(root, file)
            destination_file_path = os.path.join(destination_folder, file)

            if not os.path.exists(destination_file_path):
                shutil.move(source_file_path, destination_file_path)
                print(f"Moved {source_file_path} to {destination_file_path}")
            elif os.path.samefile(source_file_path, destination_file_path):
                # The walk reached the destination folder itself; removing the
                # "source" here would delete the only copy of the file.
                continue
            elif filecmp.cmp(source_file_path, destination_file_path, shallow=False):
                # Byte-for-byte identical: a real duplicate, safe to drop.
                os.remove(source_file_path)
            else:
                # Same name, different content: keep the source for manual review.
                print(
                    f"Skipped {source_file_path}: {destination_file_path} "
                    f"already exists with different content"
                )

# Gather the venue files of every extracted day into a single folder.
source_root = "../Raw_Data/"            # tree that holds the per-day folders
destination_folder = "../Data/Venue"    # flat folder the files end up in
target_subdir = "raw_match_parquet"     # only directories with this name are searched
target_filename_prefix = "venue"        # only files starting with this are taken

collect_files(
    source_root=source_root,
    destination_folder=destination_folder,
    target_subdir=target_subdir,
    target_filename_prefix=target_filename_prefix,
)


Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12260075.parquet to ../Data/Venue\venue_12260075.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12260076.parquet to ../Data/Venue\venue_12260076.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12260077.parquet to ../Data/Venue\venue_12260077.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12260078.parquet to ../Data/Venue\venue_12260078.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12260080.parquet to ../Data/Venue\venue_12260080.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12260081.parquet to ../Data/Venue\venue_12260081.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12260085.parquet to ../Data/Venue\venue_12260085.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12261594.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12295428.parquet to ../Data/Venue\venue_12295428.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12295429.parquet to ../Data/Venue\venue_12295429.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12295430.parquet to ../Data/Venue\venue_12295430.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12295431.parquet to ../Data/Venue\venue_12295431.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12295432.parquet to ../Data/Venue\venue_12295432.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12295433.parquet to ../Data/Venue\venue_12295433.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12295434.parquet to ../Data/Venue\venue_12295434.parquet
Copied ../Raw_Data/raw_data\20240501\data\raw\raw_match_parquet\venue_12295435.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240502\data\raw\raw_match_parquet\venue_12295739.parquet to ../Data/Venue\venue_12295739.parquet
Copied ../Raw_Data/raw_data\20240502\data\raw\raw_match_parquet\venue_12295981.parquet to ../Data/Venue\venue_12295981.parquet
Copied ../Raw_Data/raw_data\20240502\data\raw\raw_match_parquet\venue_12296111.parquet to ../Data/Venue\venue_12296111.parquet
Copied ../Raw_Data/raw_data\20240502\data\raw\raw_match_parquet\venue_12296133.parquet to ../Data/Venue\venue_12296133.parquet
Copied ../Raw_Data/raw_data\20240502\data\raw\raw_match_parquet\venue_12296279.parquet to ../Data/Venue\venue_12296279.parquet
Copied ../Raw_Data/raw_data\20240502\data\raw\raw_match_parquet\venue_12296445.parquet to ../Data/Venue\venue_12296445.parquet
Copied ../Raw_Data/raw_data\20240502\data\raw\raw_match_parquet\venue_12297011.parquet to ../Data/Venue\venue_12297011.parquet
Copied ../Raw_Data/raw_data\20240502\data\raw\raw_match_parquet\venue_12297829.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240503\data\raw\raw_match_parquet\venue_12301549.parquet to ../Data/Venue\venue_12301549.parquet
Copied ../Raw_Data/raw_data\20240503\data\raw\raw_match_parquet\venue_12301588.parquet to ../Data/Venue\venue_12301588.parquet
Copied ../Raw_Data/raw_data\20240503\data\raw\raw_match_parquet\venue_12301594.parquet to ../Data/Venue\venue_12301594.parquet
Copied ../Raw_Data/raw_data\20240503\data\raw\raw_match_parquet\venue_12301636.parquet to ../Data/Venue\venue_12301636.parquet
Copied ../Raw_Data/raw_data\20240503\data\raw\raw_match_parquet\venue_12301637.parquet to ../Data/Venue\venue_12301637.parquet
Copied ../Raw_Data/raw_data\20240503\data\raw\raw_match_parquet\venue_12301647.parquet to ../Data/Venue\venue_12301647.parquet
Copied ../Raw_Data/raw_data\20240503\data\raw\raw_match_parquet\venue_12301676.parquet to ../Data/Venue\venue_12301676.parquet
Copied ../Raw_Data/raw_data\20240503\data\raw\raw_match_parquet\venue_12301690.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240504\data\raw\raw_match_parquet\venue_12306142.parquet to ../Data/Venue\venue_12306142.parquet
Copied ../Raw_Data/raw_data\20240504\data\raw\raw_match_parquet\venue_12306143.parquet to ../Data/Venue\venue_12306143.parquet
Copied ../Raw_Data/raw_data\20240504\data\raw\raw_match_parquet\venue_12306144.parquet to ../Data/Venue\venue_12306144.parquet
Copied ../Raw_Data/raw_data\20240504\data\raw\raw_match_parquet\venue_12306145.parquet to ../Data/Venue\venue_12306145.parquet
Copied ../Raw_Data/raw_data\20240504\data\raw\raw_match_parquet\venue_12306146.parquet to ../Data/Venue\venue_12306146.parquet
Copied ../Raw_Data/raw_data\20240504\data\raw\raw_match_parquet\venue_12306147.parquet to ../Data/Venue\venue_12306147.parquet
Copied ../Raw_Data/raw_data\20240504\data\raw\raw_match_parquet\venue_12306148.parquet to ../Data/Venue\venue_12306148.parquet
Copied ../Raw_Data/raw_data\20240504\data\raw\raw_match_parquet\venue_12306149.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12306163.parquet to ../Data/Venue\venue_12306163.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12306318.parquet to ../Data/Venue\venue_12306318.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12306320.parquet to ../Data/Venue\venue_12306320.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12306321.parquet to ../Data/Venue\venue_12306321.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12306322.parquet to ../Data/Venue\venue_12306322.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12306325.parquet to ../Data/Venue\venue_12306325.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12306326.parquet to ../Data/Venue\venue_12306326.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12306382.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12309107.parquet to ../Data/Venue\venue_12309107.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12309108.parquet to ../Data/Venue\venue_12309108.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12309109.parquet to ../Data/Venue\venue_12309109.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12309110.parquet to ../Data/Venue\venue_12309110.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12309112.parquet to ../Data/Venue\venue_12309112.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12309115.parquet to ../Data/Venue\venue_12309115.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12309116.parquet to ../Data/Venue\venue_12309116.parquet
Copied ../Raw_Data/raw_data\20240505\data\raw\raw_match_parquet\venue_12309126.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12307322.parquet to ../Data/Venue\venue_12307322.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12307327.parquet to ../Data/Venue\venue_12307327.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12307363.parquet to ../Data/Venue\venue_12307363.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12307370.parquet to ../Data/Venue\venue_12307370.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12307376.parquet to ../Data/Venue\venue_12307376.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12309144.parquet to ../Data/Venue\venue_12309144.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12309239.parquet to ../Data/Venue\venue_12309239.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12309240.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12309894.parquet to ../Data/Venue\venue_12309894.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12309895.parquet to ../Data/Venue\venue_12309895.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12309896.parquet to ../Data/Venue\venue_12309896.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12309897.parquet to ../Data/Venue\venue_12309897.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12309898.parquet to ../Data/Venue\venue_12309898.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12309899.parquet to ../Data/Venue\venue_12309899.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12309900.parquet to ../Data/Venue\venue_12309900.parquet
Copied ../Raw_Data/raw_data\20240506\data\raw\raw_match_parquet\venue_12309901.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12310128.parquet to ../Data/Venue\venue_12310128.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12310130.parquet to ../Data/Venue\venue_12310130.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12310133.parquet to ../Data/Venue\venue_12310133.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12310135.parquet to ../Data/Venue\venue_12310135.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12310137.parquet to ../Data/Venue\venue_12310137.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12310700.parquet to ../Data/Venue\venue_12310700.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12311266.parquet to ../Data/Venue\venue_12311266.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12311391.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12313740.parquet to ../Data/Venue\venue_12313740.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12313743.parquet to ../Data/Venue\venue_12313743.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12313745.parquet to ../Data/Venue\venue_12313745.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12313746.parquet to ../Data/Venue\venue_12313746.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12313747.parquet to ../Data/Venue\venue_12313747.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12313749.parquet to ../Data/Venue\venue_12313749.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12313750.parquet to ../Data/Venue\venue_12313750.parquet
Copied ../Raw_Data/raw_data\20240507\data\raw\raw_match_parquet\venue_12313758.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240508\data\raw\raw_match_parquet\venue_12313742.parquet to ../Data/Venue\venue_12313742.parquet
Copied ../Raw_Data/raw_data\20240508\data\raw\raw_match_parquet\venue_12313744.parquet to ../Data/Venue\venue_12313744.parquet
Copied ../Raw_Data/raw_data\20240508\data\raw\raw_match_parquet\venue_12313748.parquet to ../Data/Venue\venue_12313748.parquet
Copied ../Raw_Data/raw_data\20240508\data\raw\raw_match_parquet\venue_12313751.parquet to ../Data/Venue\venue_12313751.parquet
Copied ../Raw_Data/raw_data\20240508\data\raw\raw_match_parquet\venue_12313763.parquet to ../Data/Venue\venue_12313763.parquet
Copied ../Raw_Data/raw_data\20240508\data\raw\raw_match_parquet\venue_12315161.parquet to ../Data/Venue\venue_12315161.parquet
Copied ../Raw_Data/raw_data\20240508\data\raw\raw_match_parquet\venue_12315164.parquet to ../Data/Venue\venue_12315164.parquet
Copied ../Raw_Data/raw_data\20240508\data\raw\raw_match_parquet\venue_12315216.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240509\data\raw\raw_match_parquet\venue_12302326.parquet to ../Data/Venue\venue_12302326.parquet
Copied ../Raw_Data/raw_data\20240509\data\raw\raw_match_parquet\venue_12302332.parquet to ../Data/Venue\venue_12302332.parquet
Copied ../Raw_Data/raw_data\20240509\data\raw\raw_match_parquet\venue_12311906.parquet to ../Data/Venue\venue_12311906.parquet
Copied ../Raw_Data/raw_data\20240509\data\raw\raw_match_parquet\venue_12311908.parquet to ../Data/Venue\venue_12311908.parquet
Copied ../Raw_Data/raw_data\20240509\data\raw\raw_match_parquet\venue_12311910.parquet to ../Data/Venue\venue_12311910.parquet
Copied ../Raw_Data/raw_data\20240509\data\raw\raw_match_parquet\venue_12311912.parquet to ../Data/Venue\venue_12311912.parquet
Copied ../Raw_Data/raw_data\20240509\data\raw\raw_match_parquet\venue_12311913.parquet to ../Data/Venue\venue_12311913.parquet
Copied ../Raw_Data/raw_data\20240509\data\raw\raw_match_parquet\venue_12311914.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240510\data\raw\raw_match_parquet\venue_12321031.parquet to ../Data/Venue\venue_12321031.parquet
Copied ../Raw_Data/raw_data\20240510\data\raw\raw_match_parquet\venue_12321094.parquet to ../Data/Venue\venue_12321094.parquet
Copied ../Raw_Data/raw_data\20240510\data\raw\raw_match_parquet\venue_12321141.parquet to ../Data/Venue\venue_12321141.parquet
Copied ../Raw_Data/raw_data\20240510\data\raw\raw_match_parquet\venue_12321191.parquet to ../Data/Venue\venue_12321191.parquet
Copied ../Raw_Data/raw_data\20240510\data\raw\raw_match_parquet\venue_12321293.parquet to ../Data/Venue\venue_12321293.parquet
Copied ../Raw_Data/raw_data\20240510\data\raw\raw_match_parquet\venue_12321419.parquet to ../Data/Venue\venue_12321419.parquet
Copied ../Raw_Data/raw_data\20240510\data\raw\raw_match_parquet\venue_12321473.parquet to ../Data/Venue\venue_12321473.parquet
Copied ../Raw_Data/raw_data\20240510\data\raw\raw_match_parquet\venue_12321510.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240511\data\raw\raw_match_parquet\venue_12326114.parquet to ../Data/Venue\venue_12326114.parquet
Copied ../Raw_Data/raw_data\20240511\data\raw\raw_match_parquet\venue_12326115.parquet to ../Data/Venue\venue_12326115.parquet
Copied ../Raw_Data/raw_data\20240511\data\raw\raw_match_parquet\venue_12326116.parquet to ../Data/Venue\venue_12326116.parquet
Copied ../Raw_Data/raw_data\20240511\data\raw\raw_match_parquet\venue_12326117.parquet to ../Data/Venue\venue_12326117.parquet
Copied ../Raw_Data/raw_data\20240511\data\raw\raw_match_parquet\venue_12326118.parquet to ../Data/Venue\venue_12326118.parquet
Copied ../Raw_Data/raw_data\20240511\data\raw\raw_match_parquet\venue_12326119.parquet to ../Data/Venue\venue_12326119.parquet
Copied ../Raw_Data/raw_data\20240511\data\raw\raw_match_parquet\venue_12326120.parquet to ../Data/Venue\venue_12326120.parquet
Copied ../Raw_Data/raw_data\20240511\data\raw\raw_match_parquet\venue_12326121.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12326067.parquet to ../Data/Venue\venue_12326067.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12326068.parquet to ../Data/Venue\venue_12326068.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12326073.parquet to ../Data/Venue\venue_12326073.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12326162.parquet to ../Data/Venue\venue_12326162.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12326166.parquet to ../Data/Venue\venue_12326166.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12326176.parquet to ../Data/Venue\venue_12326176.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12326344.parquet to ../Data/Venue\venue_12326344.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12326362.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12328274.parquet to ../Data/Venue\venue_12328274.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12328275.parquet to ../Data/Venue\venue_12328275.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12328277.parquet to ../Data/Venue\venue_12328277.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12328278.parquet to ../Data/Venue\venue_12328278.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12328279.parquet to ../Data/Venue\venue_12328279.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12328280.parquet to ../Data/Venue\venue_12328280.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12328282.parquet to ../Data/Venue\venue_12328282.parquet
Copied ../Raw_Data/raw_data\20240512\data\raw\raw_match_parquet\venue_12328287.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12327570.parquet to ../Data/Venue\venue_12327570.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12327571.parquet to ../Data/Venue\venue_12327571.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12327572.parquet to ../Data/Venue\venue_12327572.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12327573.parquet to ../Data/Venue\venue_12327573.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12327574.parquet to ../Data/Venue\venue_12327574.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12327575.parquet to ../Data/Venue\venue_12327575.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12327669.parquet to ../Data/Venue\venue_12327669.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12327682.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12331468.parquet to ../Data/Venue\venue_12331468.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12331470.parquet to ../Data/Venue\venue_12331470.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12331471.parquet to ../Data/Venue\venue_12331471.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12331472.parquet to ../Data/Venue\venue_12331472.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12331473.parquet to ../Data/Venue\venue_12331473.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12331474.parquet to ../Data/Venue\venue_12331474.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12331476.parquet to ../Data/Venue\venue_12331476.parquet
Copied ../Raw_Data/raw_data\20240513\data\raw\raw_match_parquet\venue_12331478.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240514\data\raw\raw_match_parquet\venue_12331284.parquet to ../Data/Venue\venue_12331284.parquet
Copied ../Raw_Data/raw_data\20240514\data\raw\raw_match_parquet\venue_12331297.parquet to ../Data/Venue\venue_12331297.parquet
Copied ../Raw_Data/raw_data\20240514\data\raw\raw_match_parquet\venue_12331377.parquet to ../Data/Venue\venue_12331377.parquet
Copied ../Raw_Data/raw_data\20240514\data\raw\raw_match_parquet\venue_12331379.parquet to ../Data/Venue\venue_12331379.parquet
Copied ../Raw_Data/raw_data\20240514\data\raw\raw_match_parquet\venue_12331382.parquet to ../Data/Venue\venue_12331382.parquet
Copied ../Raw_Data/raw_data\20240514\data\raw\raw_match_parquet\venue_12331383.parquet to ../Data/Venue\venue_12331383.parquet
Copied ../Raw_Data/raw_data\20240514\data\raw\raw_match_parquet\venue_12331384.parquet to ../Data/Venue\venue_12331384.parquet
Copied ../Raw_Data/raw_data\20240514\data\raw\raw_match_parquet\venue_12331385.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12299558.parquet to ../Data/Venue\venue_12299558.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12299570.parquet to ../Data/Venue\venue_12299570.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12302309.parquet to ../Data/Venue\venue_12302309.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12317294.parquet to ../Data/Venue\venue_12317294.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12317297.parquet to ../Data/Venue\venue_12317297.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12317301.parquet to ../Data/Venue\venue_12317301.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12317303.parquet to ../Data/Venue\venue_12317303.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12317306.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12336565.parquet to ../Data/Venue\venue_12336565.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12336638.parquet to ../Data/Venue\venue_12336638.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12336649.parquet to ../Data/Venue\venue_12336649.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12336650.parquet to ../Data/Venue\venue_12336650.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12336651.parquet to ../Data/Venue\venue_12336651.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12336663.parquet to ../Data/Venue\venue_12336663.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12336664.parquet to ../Data/Venue\venue_12336664.parquet
Copied ../Raw_Data/raw_data\20240515\data\raw\raw_match_parquet\venue_12336669.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240516\data\raw\raw_match_parquet\venue_12339320.parquet to ../Data/Venue\venue_12339320.parquet
Copied ../Raw_Data/raw_data\20240516\data\raw\raw_match_parquet\venue_12339328.parquet to ../Data/Venue\venue_12339328.parquet
Copied ../Raw_Data/raw_data\20240516\data\raw\raw_match_parquet\venue_12339375.parquet to ../Data/Venue\venue_12339375.parquet
Copied ../Raw_Data/raw_data\20240516\data\raw\raw_match_parquet\venue_12339376.parquet to ../Data/Venue\venue_12339376.parquet
Copied ../Raw_Data/raw_data\20240516\data\raw\raw_match_parquet\venue_12339377.parquet to ../Data/Venue\venue_12339377.parquet
Copied ../Raw_Data/raw_data\20240516\data\raw\raw_match_parquet\venue_12339382.parquet to ../Data/Venue\venue_12339382.parquet
Copied ../Raw_Data/raw_data\20240516\data\raw\raw_match_parquet\venue_12339417.parquet to ../Data/Venue\venue_12339417.parquet
Copied ../Raw_Data/raw_data\20240516\data\raw\raw_match_parquet\venue_12339462.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12341997.parquet to ../Data/Venue\venue_12341997.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12341998.parquet to ../Data/Venue\venue_12341998.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12342174.parquet to ../Data/Venue\venue_12342174.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12342209.parquet to ../Data/Venue\venue_12342209.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12342216.parquet to ../Data/Venue\venue_12342216.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12342217.parquet to ../Data/Venue\venue_12342217.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12342218.parquet to ../Data/Venue\venue_12342218.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12342219.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12344594.parquet to ../Data/Venue\venue_12344594.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12344595.parquet to ../Data/Venue\venue_12344595.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12344596.parquet to ../Data/Venue\venue_12344596.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12344597.parquet to ../Data/Venue\venue_12344597.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12344598.parquet to ../Data/Venue\venue_12344598.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12344599.parquet to ../Data/Venue\venue_12344599.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12344600.parquet to ../Data/Venue\venue_12344600.parquet
Copied ../Raw_Data/raw_data\20240518\data\raw\raw_match_parquet\venue_12344601.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12344513.parquet to ../Data/Venue\venue_12344513.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12344514.parquet to ../Data/Venue\venue_12344514.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12344637.parquet to ../Data/Venue\venue_12344637.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12344705.parquet to ../Data/Venue\venue_12344705.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12344720.parquet to ../Data/Venue\venue_12344720.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12344724.parquet to ../Data/Venue\venue_12344724.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12344730.parquet to ../Data/Venue\venue_12344730.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12344731.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12346496.parquet to ../Data/Venue\venue_12346496.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12346497.parquet to ../Data/Venue\venue_12346497.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12346498.parquet to ../Data/Venue\venue_12346498.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12346499.parquet to ../Data/Venue\venue_12346499.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12346500.parquet to ../Data/Venue\venue_12346500.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12346501.parquet to ../Data/Venue\venue_12346501.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12346502.parquet to ../Data/Venue\venue_12346502.parquet
Copied ../Raw_Data/raw_data\20240519\data\raw\raw_match_parquet\venue_12346503.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12346119.parquet to ../Data/Venue\venue_12346119.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12346124.parquet to ../Data/Venue\venue_12346124.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12346125.parquet to ../Data/Venue\venue_12346125.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12346133.parquet to ../Data/Venue\venue_12346133.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12346139.parquet to ../Data/Venue\venue_12346139.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12346142.parquet to ../Data/Venue\venue_12346142.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12346155.parquet to ../Data/Venue\venue_12346155.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12346163.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12350705.parquet to ../Data/Venue\venue_12350705.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12350706.parquet to ../Data/Venue\venue_12350706.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12350708.parquet to ../Data/Venue\venue_12350708.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12350709.parquet to ../Data/Venue\venue_12350709.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12350710.parquet to ../Data/Venue\venue_12350710.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12350711.parquet to ../Data/Venue\venue_12350711.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12350712.parquet to ../Data/Venue\venue_12350712.parquet
Copied ../Raw_Data/raw_data\20240520\data\raw\raw_match_parquet\venue_12350715.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12350523.parquet to ../Data/Venue\venue_12350523.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12350598.parquet to ../Data/Venue\venue_12350598.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12350619.parquet to ../Data/Venue\venue_12350619.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12350681.parquet to ../Data/Venue\venue_12350681.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12350714.parquet to ../Data/Venue\venue_12350714.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12350718.parquet to ../Data/Venue\venue_12350718.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12350745.parquet to ../Data/Venue\venue_12350745.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12350903.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12354710.parquet to ../Data/Venue\venue_12354710.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12354712.parquet to ../Data/Venue\venue_12354712.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12354767.parquet to ../Data/Venue\venue_12354767.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12354781.parquet to ../Data/Venue\venue_12354781.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12354941.parquet to ../Data/Venue\venue_12354941.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12354969.parquet to ../Data/Venue\venue_12354969.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12354971.parquet to ../Data/Venue\venue_12354971.parquet
Copied ../Raw_Data/raw_data\20240521\data\raw\raw_match_parquet\venue_12355086.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240522\data\raw\raw_match_parquet\venue_12356459.parquet to ../Data/Venue\venue_12356459.parquet
Copied ../Raw_Data/raw_data\20240522\data\raw\raw_match_parquet\venue_12357013.parquet to ../Data/Venue\venue_12357013.parquet
Copied ../Raw_Data/raw_data\20240522\data\raw\raw_match_parquet\venue_12357061.parquet to ../Data/Venue\venue_12357061.parquet
Copied ../Raw_Data/raw_data\20240522\data\raw\raw_match_parquet\venue_12357062.parquet to ../Data/Venue\venue_12357062.parquet
Copied ../Raw_Data/raw_data\20240522\data\raw\raw_match_parquet\venue_12357063.parquet to ../Data/Venue\venue_12357063.parquet
Copied ../Raw_Data/raw_data\20240522\data\raw\raw_match_parquet\venue_12357402.parquet to ../Data/Venue\venue_12357402.parquet
Copied ../Raw_Data/raw_data\20240522\data\raw\raw_match_parquet\venue_12357403.parquet to ../Data/Venue\venue_12357403.parquet
Copied ../Raw_Data/raw_data\20240522\data\raw\raw_match_parquet\venue_12357470.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240523\data\raw\raw_match_parquet\venue_12357923.parquet to ../Data/Venue\venue_12357923.parquet
Copied ../Raw_Data/raw_data\20240523\data\raw\raw_match_parquet\venue_12358197.parquet to ../Data/Venue\venue_12358197.parquet
Copied ../Raw_Data/raw_data\20240523\data\raw\raw_match_parquet\venue_12358394.parquet to ../Data/Venue\venue_12358394.parquet
Copied ../Raw_Data/raw_data\20240523\data\raw\raw_match_parquet\venue_12358489.parquet to ../Data/Venue\venue_12358489.parquet
Copied ../Raw_Data/raw_data\20240523\data\raw\raw_match_parquet\venue_12358562.parquet to ../Data/Venue\venue_12358562.parquet
Copied ../Raw_Data/raw_data\20240523\data\raw\raw_match_parquet\venue_12358563.parquet to ../Data/Venue\venue_12358563.parquet
Copied ../Raw_Data/raw_data\20240523\data\raw\raw_match_parquet\venue_12358578.parquet to ../Data/Venue\venue_12358578.parquet
Copied ../Raw_Data/raw_data\20240523\data\raw\raw_match_parquet\venue_12358588.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240524\data\raw\raw_match_parquet\venue_12365871.parquet to ../Data/Venue\venue_12365871.parquet
Copied ../Raw_Data/raw_data\20240524\data\raw\raw_match_parquet\venue_12365890.parquet to ../Data/Venue\venue_12365890.parquet
Copied ../Raw_Data/raw_data\20240524\data\raw\raw_match_parquet\venue_12365891.parquet to ../Data/Venue\venue_12365891.parquet
Copied ../Raw_Data/raw_data\20240524\data\raw\raw_match_parquet\venue_12365896.parquet to ../Data/Venue\venue_12365896.parquet
Copied ../Raw_Data/raw_data\20240524\data\raw\raw_match_parquet\venue_12365914.parquet to ../Data/Venue\venue_12365914.parquet
Copied ../Raw_Data/raw_data\20240524\data\raw\raw_match_parquet\venue_12365963.parquet to ../Data/Venue\venue_12365963.parquet
Copied ../Raw_Data/raw_data\20240524\data\raw\raw_match_parquet\venue_12365971.parquet to ../Data/Venue\venue_12365971.parquet
Copied ../Raw_Data/raw_data\20240524\data\raw\raw_match_parquet\venue_12365972.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240525\data\raw\raw_match_parquet\venue_12368623.parquet to ../Data/Venue\venue_12368623.parquet
Copied ../Raw_Data/raw_data\20240525\data\raw\raw_match_parquet\venue_12368629.parquet to ../Data/Venue\venue_12368629.parquet
Copied ../Raw_Data/raw_data\20240525\data\raw\raw_match_parquet\venue_12368630.parquet to ../Data/Venue\venue_12368630.parquet
Copied ../Raw_Data/raw_data\20240525\data\raw\raw_match_parquet\venue_12368631.parquet to ../Data/Venue\venue_12368631.parquet
Copied ../Raw_Data/raw_data\20240525\data\raw\raw_match_parquet\venue_12368632.parquet to ../Data/Venue\venue_12368632.parquet
Copied ../Raw_Data/raw_data\20240525\data\raw\raw_match_parquet\venue_12368633.parquet to ../Data/Venue\venue_12368633.parquet
Copied ../Raw_Data/raw_data\20240525\data\raw\raw_match_parquet\venue_12368634.parquet to ../Data/Venue\venue_12368634.parquet
Copied ../Raw_Data/raw_data\20240525\data\raw\raw_match_parquet\venue_12368635.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12368728.parquet to ../Data/Venue\venue_12368728.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12368761.parquet to ../Data/Venue\venue_12368761.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12368843.parquet to ../Data/Venue\venue_12368843.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12368844.parquet to ../Data/Venue\venue_12368844.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12368902.parquet to ../Data/Venue\venue_12368902.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12369040.parquet to ../Data/Venue\venue_12369040.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12369041.parquet to ../Data/Venue\venue_12369041.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12369043.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12370534.parquet to ../Data/Venue\venue_12370534.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12370535.parquet to ../Data/Venue\venue_12370535.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12370536.parquet to ../Data/Venue\venue_12370536.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12370537.parquet to ../Data/Venue\venue_12370537.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12370538.parquet to ../Data/Venue\venue_12370538.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12370539.parquet to ../Data/Venue\venue_12370539.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12370540.parquet to ../Data/Venue\venue_12370540.parquet
Copied ../Raw_Data/raw_data\20240526\data\raw\raw_match_parquet\venue_12370541.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12370190.parquet to ../Data/Venue\venue_12370190.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12370191.parquet to ../Data/Venue\venue_12370191.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12370579.parquet to ../Data/Venue\venue_12370579.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12370668.parquet to ../Data/Venue\venue_12370668.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12370670.parquet to ../Data/Venue\venue_12370670.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12370673.parquet to ../Data/Venue\venue_12370673.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12370675.parquet to ../Data/Venue\venue_12370675.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12370689.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12373035.parquet to ../Data/Venue\venue_12373035.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12373044.parquet to ../Data/Venue\venue_12373044.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12373045.parquet to ../Data/Venue\venue_12373045.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12373046.parquet to ../Data/Venue\venue_12373046.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12373047.parquet to ../Data/Venue\venue_12373047.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12373049.parquet to ../Data/Venue\venue_12373049.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12373050.parquet to ../Data/Venue\venue_12373050.parquet
Copied ../Raw_Data/raw_data\20240527\data\raw\raw_match_parquet\venue_12373051.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12372763.parquet to ../Data/Venue\venue_12372763.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12372998.parquet to ../Data/Venue\venue_12372998.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12373000.parquet to ../Data/Venue\venue_12373000.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12373036.parquet to ../Data/Venue\venue_12373036.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12373075.parquet to ../Data/Venue\venue_12373075.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12373077.parquet to ../Data/Venue\venue_12373077.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12373079.parquet to ../Data/Venue\venue_12373079.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12373199.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12375659.parquet to ../Data/Venue\venue_12375659.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12375660.parquet to ../Data/Venue\venue_12375660.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12375661.parquet to ../Data/Venue\venue_12375661.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12375662.parquet to ../Data/Venue\venue_12375662.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12375663.parquet to ../Data/Venue\venue_12375663.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12375667.parquet to ../Data/Venue\venue_12375667.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12375668.parquet to ../Data/Venue\venue_12375668.parquet
Copied ../Raw_Data/raw_data\20240528\data\raw\raw_match_parquet\venue_12375669.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240529\data\raw\raw_match_parquet\venue_12375800.parquet to ../Data/Venue\venue_12375800.parquet
Copied ../Raw_Data/raw_data\20240529\data\raw\raw_match_parquet\venue_12375866.parquet to ../Data/Venue\venue_12375866.parquet
Copied ../Raw_Data/raw_data\20240529\data\raw\raw_match_parquet\venue_12375884.parquet to ../Data/Venue\venue_12375884.parquet
Copied ../Raw_Data/raw_data\20240529\data\raw\raw_match_parquet\venue_12376138.parquet to ../Data/Venue\venue_12376138.parquet
Copied ../Raw_Data/raw_data\20240529\data\raw\raw_match_parquet\venue_12376171.parquet to ../Data/Venue\venue_12376171.parquet
Copied ../Raw_Data/raw_data\20240529\data\raw\raw_match_parquet\venue_12376172.parquet to ../Data/Venue\venue_12376172.parquet
Copied ../Raw_Data/raw_data\20240529\data\raw\raw_match_parquet\venue_12376222.parquet to ../Data/Venue\venue_12376222.parquet
Copied ../Raw_Data/raw_data\20240529\data\raw\raw_match_parquet\venue_12376338.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240530\data\raw\raw_match_parquet\venue_12376220.parquet to ../Data/Venue\venue_12376220.parquet
Copied ../Raw_Data/raw_data\20240530\data\raw\raw_match_parquet\venue_12376385.parquet to ../Data/Venue\venue_12376385.parquet
Copied ../Raw_Data/raw_data\20240530\data\raw\raw_match_parquet\venue_12376756.parquet to ../Data/Venue\venue_12376756.parquet
Copied ../Raw_Data/raw_data\20240530\data\raw\raw_match_parquet\venue_12376800.parquet to ../Data/Venue\venue_12376800.parquet
Copied ../Raw_Data/raw_data\20240530\data\raw\raw_match_parquet\venue_12376802.parquet to ../Data/Venue\venue_12376802.parquet
Copied ../Raw_Data/raw_data\20240530\data\raw\raw_match_parquet\venue_12376895.parquet to ../Data/Venue\venue_12376895.parquet
Copied ../Raw_Data/raw_data\20240530\data\raw\raw_match_parquet\venue_12376902.parquet to ../Data/Venue\venue_12376902.parquet
Copied ../Raw_Data/raw_data\20240530\data\raw\raw_match_parquet\venue_12377251.parquet to ../Data/Venue\venue_1

Copied ../Raw_Data/raw_data\20240531\data\raw\raw_match_parquet\venue_12361492.parquet to ../Data/Venue\venue_12361492.parquet
Copied ../Raw_Data/raw_data\20240531\data\raw\raw_match_parquet\venue_12361494.parquet to ../Data/Venue\venue_12361494.parquet
Copied ../Raw_Data/raw_data\20240531\data\raw\raw_match_parquet\venue_12361500.parquet to ../Data/Venue\venue_12361500.parquet
Copied ../Raw_Data/raw_data\20240531\data\raw\raw_match_parquet\venue_12361503.parquet to ../Data/Venue\venue_12361503.parquet
Copied ../Raw_Data/raw_data\20240531\data\raw\raw_match_parquet\venue_12380437.parquet to ../Data/Venue\venue_12380437.parquet
Copied ../Raw_Data/raw_data\20240531\data\raw\raw_match_parquet\venue_12380438.parquet to ../Data/Venue\venue_12380438.parquet
Copied ../Raw_Data/raw_data\20240531\data\raw\raw_match_parquet\venue_12380451.parquet to ../Data/Venue\venue_12380451.parquet
Copied ../Raw_Data/raw_data\20240531\data\raw\raw_match_parquet\venue_12380454.parquet to ../Data/Venue\venue_1

In [9]:
def create_dataframe(folder_path):
    """
    Read all Parquet files in a folder and concatenate them into a single DataFrame.

    Files are read in sorted filename order so that the row order of the result
    is reproducible (``os.listdir`` returns entries in arbitrary order).

    Parameters:
    folder_path (str): The path to the folder containing the Parquet files.

    Returns:
    pd.DataFrame: A DataFrame containing the concatenated data from all Parquet
        files, with a fresh 0..n-1 index. If the folder contains no ``.parquet``
        files, an empty DataFrame is returned.
    """
    # List all Parquet files in the folder, in a deterministic order
    parquet_files = sorted(f for f in os.listdir(folder_path) if f.endswith('.parquet'))

    # pd.concat raises ValueError when given an empty list, so handle that case here
    if not parquet_files:
        return pd.DataFrame()

    # Read each Parquet file and concatenate into a single dataframe
    dataframes = [pd.read_parquet(os.path.join(folder_path, f)) for f in parquet_files]
    combined_dataframe = pd.concat(dataframes, ignore_index=True)

    return combined_dataframe


## Next, we inspect one sample file of each type to get familiar with the data structure

In [None]:
# Location of the single sample match used to explore the raw schema.
# Change the day folder or the match id to inspect a different match.
SAMPLE_DAY_DIR = '../Raw_Data/raw_data/20240501/data/raw'
SAMPLE_MATCH_ID = 12260075


def read_sample_table(subdir, prefix):
    """
    Read one raw Parquet file of the sample match.

    Parameters:
    subdir (str): Sub-folder of SAMPLE_DAY_DIR that holds the file.
    prefix (str): File-name prefix; the file read is `<prefix>_<SAMPLE_MATCH_ID>.parquet`.

    Returns:
    pd.DataFrame: The contents of that Parquet file.
    """
    return pd.read_parquet(f'{SAMPLE_DAY_DIR}/{subdir}/{prefix}_{SAMPLE_MATCH_ID}.parquet')


# Files stored under raw_match_parquet
away_team = read_sample_table('raw_match_parquet', 'away_team')
away_team_score = read_sample_table('raw_match_parquet', 'away_team_score')
event = read_sample_table('raw_match_parquet', 'event')
home_team = read_sample_table('raw_match_parquet', 'home_team')
home_team_score = read_sample_table('raw_match_parquet', 'home_team_score')
# `rond` / `tournoment` keep their original spelling because later cells display them by these names
rond = read_sample_table('raw_match_parquet', 'round')
season = read_sample_table('raw_match_parquet', 'season')
# NOTE(review): `time` would shadow the standard-library module of the same name if it were imported
time = read_sample_table('raw_match_parquet', 'time')
tournoment = read_sample_table('raw_match_parquet', 'tournament')
venue = read_sample_table('raw_match_parquet', 'venue')

# Files stored in their own sub-folders
pbp = read_sample_table('raw_point_by_point_parquet', 'pbp')
statistics = read_sample_table('raw_statistics_parquet', 'statistics')


In [None]:
# Display the away-team table read from the sample match file.
away_team

In [None]:
# Display the away-team score table read from the sample match file.
away_team_score

In [None]:
# Display the home-team table read from the sample match file.
home_team

In [None]:
# Display the home-team score table read from the sample match file.
home_team_score

In [None]:
# Display the event table read from the sample match file.
event

In [None]:
# Display the round table of the sample match (the variable is spelled `rond` where it is
# assigned; presumably to avoid shadowing the built-in `round` — TODO confirm).
rond

In [None]:
# Display the season table read from the sample match file.
season

In [None]:
# Display the time table read from the sample match file.
# NOTE(review): this name would shadow the standard-library `time` module if it were imported.
time

In [None]:
# Display the tournament table of the sample match (the variable is spelled `tournoment`
# where it is assigned).
tournoment

In [None]:
# Display the venue table read from the sample match file.
venue

In [None]:
# Display the table read from the sample match's raw_point_by_point_parquet file.
pbp

In [None]:
# Display the table read from the sample match's raw_statistics_parquet file.
statistics

In [10]:
# Build one combined DataFrame per category folder under ../Data.
# In every group the target names and the folder names are listed in the same
# order: the n-th name receives the frame built from the n-th folder.
(
    MatchEventInfo,
    MatchVotesInfo,
    MatchTournamentInfo,
    MatchSeasonInfo,
    MatchVenueInfo,
) = [
    create_dataframe('../Data/' + category + '/')
    for category in ('Event', 'Votes', 'Tournament', 'Season', 'Venue')
]

(
    MatchAwayTeamInfo,
    MatchRoundInfo,
    MatchAwayScoreInfo,
    MatchHomeScoreInfo,
    MatchHomeTeamInfo,
) = [
    create_dataframe('../Data/' + category + '/')
    for category in ('AwayTeam', 'Round', 'AwayTeamScore', 'HomeTeamScore', 'HomeTeam')
]

# Note the last pairing: PeriodInfo is built from the Stat folder.
(
    PowerInfo,
    GameInfo,
    OddsInfo,
    TimeInfo,
    PeriodInfo,
) = [
    create_dataframe('../Data/' + category + '/')
    for category in ('Power', 'GameInfo', 'Odds', 'Time', 'Stat')
]

  combined_dataframe = pd.concat(dataframes, ignore_index=True)
  combined_dataframe = pd.concat(dataframes, ignore_index=True)


In [11]:
# Persist every combined table as ../Aggregation/<TableName>.parquet.

# to_parquet does not create missing parent folders, so create the output
# folder first (no-op when it already exists).
os.makedirs('../Aggregation', exist_ok=True)

# Output file stem -> combined DataFrame; the stem is the variable name.
aggregated_tables = {
    'MatchEventInfo': MatchEventInfo,
    'MatchVotesInfo': MatchVotesInfo,
    'MatchTournamentInfo': MatchTournamentInfo,
    'MatchSeasonInfo': MatchSeasonInfo,
    'MatchVenueInfo': MatchVenueInfo,
    'MatchAwayTeamInfo': MatchAwayTeamInfo,
    'MatchRoundInfo': MatchRoundInfo,
    'MatchAwayScoreInfo': MatchAwayScoreInfo,
    'MatchHomeScoreInfo': MatchHomeScoreInfo,
    'MatchHomeTeamInfo': MatchHomeTeamInfo,
    'PowerInfo': PowerInfo,
    'GameInfo': GameInfo,
    'OddsInfo': OddsInfo,
    'TimeInfo': TimeInfo,
    'PeriodInfo': PeriodInfo,
}

for table_name, table in aggregated_tables.items():
    table.to_parquet(f'../Aggregation/{table_name}.parquet')

In [None]:
# Rebuild only the Odds table from ../Data/Odds/ (the same call the bulk-load cell makes).
OddsInfo = create_dataframe('../Data/Odds/')

In [None]:
# Show the (rows, columns) dimensions of the combined Odds table.
OddsInfo.shape