<a href="https://colab.research.google.com/github/Jonathan-Adamson/Predictive-Modeling-in-the-NBA/blob/main/DA401_Code.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
# Importing needed packages

import pandas as pd
import numpy as np

In [8]:
# Read the 2021-2022 player table from CSV.
# The path is relative, so it is resolved against the kernel's working directory.
filename = "2021-2022 NBA Player Data.csv"
player_data_2021_2022 = pd.read_csv(filepath_or_buffer=filename)

In [7]:
def add_year_column(df, year):
    """
    Stamp every row of a DataFrame with the same year value.

    The value is written to a column called 'year'. If the DataFrame already
    has a column with that name, it is overwritten.

    Parameters:
    - df (DataFrame): DataFrame that receives the column; it is changed in place.
    - year (int): Value stored in the 'year' column for every row.

    Returns:
    - None: The caller's DataFrame is mutated instead of returning a new one.
    """
    year_column = 'year'
    # Assigning a scalar broadcasts it to all rows of the frame
    df[year_column] = year
    return None

In [9]:
# Tag every row of the 2021-2022 table with 2022 in its 'year' column
add_year_column(df=player_data_2021_2022, year=2022)

In [11]:
def inclusion_criteria(df, min_gs=25, min_mp=15, min_g=50):
    """
    Keep only the rows that satisfy all three inclusion thresholds.

    A row is kept when every one of these holds:
    - 'GS' is greater than or equal to min_gs
    - 'MP' is greater than or equal to min_mp
    - 'G' is greater than or equal to min_g

    A row with NaN in any of these columns is dropped, because a comparison
    against NaN evaluates to False.

    Parameters:
    - df (DataFrame): DataFrame to be filtered. Must contain the 'GS', 'MP'
      and 'G' columns. It is not modified.
    - min_gs (number): Lower bound (inclusive) for 'GS'. Defaults to 25.
    - min_mp (number): Lower bound (inclusive) for 'MP'. Defaults to 15.
    - min_g (number): Lower bound (inclusive) for 'G'. Defaults to 50.

    Returns:
    - filtered_df (DataFrame): Independent copy of the qualifying rows, with
      their original index labels.

    Raises:
    - KeyError: If 'GS', 'MP' or 'G' is not a column of df.
    """
    meets_thresholds = (
        (df['GS'] >= min_gs)
        & (df['MP'] >= min_mp)
        & (df['G'] >= min_g)
    )
    # Return an explicit copy so that in-place column assignments on the
    # result do not trigger SettingWithCopyWarning.
    filtered_df = df.loc[meets_thresholds].copy()
    return filtered_df


In [None]:
# Preview the rows that satisfy the inclusion criteria. The result is only
# displayed here, not assigned, so player_data_2021_2022 keeps every row.
inclusion_criteria(df=player_data_2021_2022)

In [14]:
def add_all_nba_column(df, names_list):
    """
    Flag each row with 'Yes' or 'No' depending on whether its player is listed.

    An 'All_NBA' column is written to the DataFrame: 'Yes' where the value in
    the 'Player' column exactly matches an entry of names_list, 'No' otherwise.

    Parameters:
    - df (DataFrame): DataFrame that receives the column; must have a 'Player'
      column. It is changed in place.
    - names_list (list): Player names to be flagged with 'Yes'.

    Returns:
    - None: The caller's DataFrame is mutated instead of returning a new one.
    """
    flag_column = 'All_NBA'

    # Start with every row marked 'No'
    df[flag_column] = 'No'

    # Then flip the rows whose player appears in the supplied names
    is_listed = df['Player'].isin(names_list)
    df.loc[is_listed, flag_column] = 'Yes'
    return None

In [15]:
# Names matched against the 'Player' column to build the 'All_NBA' flag.
# Every entry needs its own trailing comma: Python silently joins adjacent
# string literals, which would merge two names into a single bogus entry.
All_NBA_2022 = [
    "Giannis Antetokounmpo",
    "Devin Booker",
    "Luka Dončić",
    "Nikola Jokić",
    "Jayson Tatum",
    "Stephen Curry",
    "DeMar DeRozan",
    "Kevin Durant",
    "Joel Embiid",
    "Ja Morant",
    "LeBron James",
    "Chris Paul",
    "Pascal Siakam",
    "Karl-Anthony Towns",
    "Trae Young",
]

In [16]:
# Add the 'All_NBA' Yes/No column to the 2021-2022 table using the All_NBA_2022 names
add_all_nba_column(df=player_data_2021_2022, names_list=All_NBA_2022)

In [None]:
# Spot check: display the row(s) whose 'Player' value is exactly 'Ja Morant'
player_data_2021_2022.loc[player_data_2021_2022["Player"] == 'Ja Morant']