In [1]:
import polars as pl
import pandas as pd
import numpy as np
import math as math
# find a better way to import?
import sys
import os
sys.path.append(os.path.join(os.path.dirname(''), '..'))

from constants import *


In [2]:
# read all data
players = pl.read_csv('../nfl-big-data-bowl-2024/players.csv')
plays = pl.read_csv('../nfl-big-data-bowl-2024/plays.csv',infer_schema_length=100000)
games = pl.read_csv('../nfl-big-data-bowl-2024/games.csv',infer_schema_length=10000)
tracking = pl.read_csv('../nfl-big-data-bowl-2024/tracking_week*.csv',infer_schema_length=10000)

In [3]:
# normalize data
players = players.with_columns([pl.col('nflId').cast(str)])
plays = plays.join(games,on='gameId')
plays = plays.with_columns([
    (pl.col('gameId').cast(str) + '-'
     + pl.col('playId').cast(str)).alias('uniquePlayId')
])

tracking = tracking.with_columns(
    (pl.col('gameId').cast(str) + '-'
     + pl.col('playId').cast(str)).alias('uniquePlayId'),
    (pl.col('gameId').cast(str) + '-'
     + pl.col('playId').cast(str) + '-'
     + pl.col('nflId').cast(str)).alias('uniquePlayerId'),
)

# normalize position
tracking=tracking.with_columns([
    pl.when(pl.col('playDirection')=='right').then(53.3-pl.col('y')).otherwise(pl.col('y')).alias('adjustedX'),
    pl.when(pl.col('playDirection')=='right').then(pl.col('x')).otherwise(120-pl.col('x')).alias('adjustedY')
])

tracking=tracking.with_columns([
    pl.when(pl.col('event')=='ball_snap').then(pl.col('frameId')).otherwise(-1).alias('startingFrameId'),
])
tracking=tracking.with_columns([
    pl.col('startingFrameId').max().over(pl.col('uniquePlayId')),
])
tracking=tracking.with_columns([
    (pl.col('frameId') - pl.col('startingFrameId')).alias('framesSinceSnap'),
])

# normalize orientation 'o' and direction 'dir'
# convert 'NA' to 0
replacement_values = {'NA': '0'}
tracking = tracking.with_columns(
    pl.col('o').apply(lambda x: replacement_values.get(x, x)),
    pl.col('dir').apply(lambda x: replacement_values.get(x, x)),
)

tracking=tracking.with_columns([
    pl.when(pl.col('playDirection')=='right').then(pl.col('dir').cast(pl.Float64)).otherwise(180-pl.col('dir').cast(pl.Float64)).alias('adjustedDir'),
    pl.when(pl.col('playDirection')=='right').then(pl.col('o').cast(pl.Float64)).otherwise((180+pl.col('o').cast(pl.Float64))%360).alias('firstAdjustedO'),
])

tracking=tracking.with_columns([
    pl.when(pl.col('firstAdjustedO') <= 180).then(180-pl.col('firstAdjustedO')).otherwise(540-pl.col('firstAdjustedO')).alias('adjustedO')
])

In [4]:
CONE_ANGLE = 120 # degrees
MAX_DISTANCE = 3 # yards
BLOCKING_RADIUS = 1.25 # yards

def angle_in_range(angle, left_boundary, right_boundary):
    return (angle - left_boundary) % 360 <= (right_boundary - left_boundary) % 360

# row = [o, dir, adjustedX, adjustedY, oDefender, dirDefender, adjustedXDefender, adjustedYDefender]
def looking_to_block_or_blocking_df_fn(row) -> int:
    blocking_status = 0
    player1 = row[0:4]
    player2 = row[4:]

    if is_in_vision_cone(player1, player2):
        blocking_status = 1

    if is_blocking(player1, player2) and blocking_status == 1:
        blocking_status = 2

    return blocking_status
    

def looking_to_block_or_blocking(player1: tuple, player2: tuple) -> int:
    blocking_status = 0
    if is_in_vision_cone(player1, player2):
        blocking_status = 1

    if is_blocking(player1, player2) and blocking_status == 1:
        blocking_status = 2

    return 0

def is_in_vision_cone(player1: tuple, player2: tuple, cone_angle=CONE_ANGLE) -> bool:
    return (is_in_angle(player1, player2, cone_angle) and is_in_distance(player1, player2))

def is_in_angle(player1: tuple, player2: tuple, cone_angle) -> bool:
    half_cone_angle = cone_angle / 2

    y_dist = player2[3] - player1[3]
    x_dist = player2[2] - player1[2]
    player1_orientation = float(player1[0]) if type(player1[0]) == str else player1[0]

    # print("isinangle")
    # print("player1")
    # print(player1)

    # print("player2")
    # print(player2)

    # print("player1_ori")
    # print(player1_orientation)

    angle = math.degrees(math.atan2(y_dist, x_dist))
    angle = (angle + 360) % 360
    
    left_vision_boundary = (360 + player1_orientation - half_cone_angle) % 360
    right_vision_boundary = (player1_orientation + half_cone_angle) % 360
    
    
#     print(left_vision_boundary)
#     print(angle)
#     print(right_vision_boundary)
#     print(angle_in_range(angle,left_vision_boundary,right_vision_boundary))

    # print("angle")
    # print(angle)

    if angle_in_range(angle,left_vision_boundary,right_vision_boundary):
        return True
    
    return False

def is_in_distance(player1: tuple, player2: tuple) -> bool:
    distance_between_players = calculate_distance(player1, player2)
    if distance_between_players <= MAX_DISTANCE:
        return True
    
    return False

def is_blocking(player1: tuple, player2: tuple) -> bool:
    distance_between_players = calculate_distance(player1, player2)
    if distance_between_players <= BLOCKING_RADIUS:
        return True

    return False


def calculate_distance(player1: tuple, player2: tuple) -> float:
    y_dist = abs(player1[3] - player2[3])
    x_dist = abs(player1[2] - player2[2])

    # print(y_dist)
    # print(x_dist)
    # print(math.sqrt(x_dist**2 + y_dist**2))

    return math.sqrt(x_dist**2 + y_dist**2)

In [11]:
# For both box and spill, player2 should be in the vision cone of 1
# This is already checked by row[8] == 0

# 0 => None
# 1 => Box
# 2 => Dent
# 3 => Spill
def type_of_block_df_fn(row) -> int:    
    player1 = row[0:4]
    player2 = row[4:]

        if (row[8] == 0 or not is_in_vision_cone(player1, player2, 50)):
        return 0
    
    if is_box(player1, player2):
        if is_dent(player1, player2):
            return 2
        return 1

    if is_spill(player1, player2):
        return 3
    
    return 0

# Defender (player2) should face the outside
def is_box(player1: tuple, player2: tuple) -> bool:
    # This should be relative to the other player
    if (0 <= player2[0] <= 90 or 270 <= player2[0] <= 360):
            return True
    
    return False

# Both players can see each other
def is_dent(player1: tuple, player2: tuple) -> bool:
    return is_in_vision_cone(player2, player1, 50)

# Defender should face the inside
def is_spill(player1: tuple, player2: tuple) -> bool:
    if (90 <= player2[0] <= 270):
        return True
        
    return False
    

In [6]:
GAME_ID = 2022091110
PLAY_ID = 3797
JERSEY_NUMBER = '62'
JERSEY_NUMBER_DEFENDER = '97'

labeled = tracking.filter(pl.col('gameId')==GAME_ID)

players = labeled.join(players,on='nflId',how='left')
players = players.join(games.select(['gameId','homeTeamAbbr','visitorTeamAbbr']),on='gameId')
players = players.with_columns([
    pl.when(pl.col('club')==pl.col('homeTeamAbbr'))
    .then(pl.col('visitorTeamAbbr'))
    .otherwise(pl.col('homeTeamAbbr'))
    .alias('opponentClub')
])


In [7]:
players = players.join(
    players,
    left_on=['gameId','playId','frameId','club'],
    right_on=['gameId','playId','frameId','opponentClub'],
    suffix='Defender'
)

In [8]:
blocking_df = players.select(
    'adjustedO', 'adjustedDir', 'adjustedX', 'adjustedY', 'adjustedODefender', 'adjustedDirDefender', 'adjustedXDefender', 'adjustedYDefender'
).apply(looking_to_block_or_blocking_df_fn)

blocking_df = blocking_df.to_series()
players = players.with_columns(blockType=blocking_df)

In [9]:
test_data = players.filter(pl.col('gameId')==GAME_ID).filter(pl.col('playId')==PLAY_ID)
# test_data = test_data.filter(pl.col('jerseyNumber')=='73').filter(pl.col('framesSinceSnap')==12)
# test_data = test_data.filter(pl.col('jerseyNumberDefender')=='91')

is_blocking_df = test_data.select(
    'adjustedO', 'adjustedDir', 'adjustedX', 'adjustedY', 'adjustedODefender', 
    'adjustedDirDefender', 'adjustedXDefender', 'adjustedYDefender'
).apply(looking_to_block_or_blocking_df_fn)

is_blocking_df = is_blocking_df.to_series()
test_data = test_data.with_columns(blockType=is_blocking_df)

In [10]:
type_of_block_df = test_data.select(
    'adjustedO', 'adjustedDir', 'adjustedX', 'adjustedY', 'adjustedODefender', 
    'adjustedDirDefender', 'adjustedXDefender', 'adjustedYDefender', 'blockType'
).apply(type_of_block_df_fn)

test_data = test_data.with_columns(boxDentSpill=type_of_block_df.to_series())

PanicException: python function failed UnboundLocalError: cannot access local variable 'player1' where it is not associated with a value

In [14]:
test_blocking = test_data.filter(pl.col('jerseyNumber')==JERSEY_NUMBER).filter(pl.col('jerseyNumberDefender')==JERSEY_NUMBER_DEFENDER)
test_blocking.select(
    'adjustedO', 'adjustedDir', 'adjustedX', 'adjustedY', 'adjustedODefender', 
    'adjustedDirDefender', 'adjustedXDefender', 'adjustedYDefender', 'blockType',
    'framesSinceSnap', 'boxDentSpill'
).filter(pl.col('boxDentSpill') != 0)

adjustedO,adjustedDir,adjustedX,adjustedY,adjustedODefender,adjustedDirDefender,adjustedXDefender,adjustedYDefender,blockType,framesSinceSnap,boxDentSpill
f64,f64,f64,f64,f64,f64,f64,f64,i64,i64,i64
29.58,179.58,33.32,18.11,215.49,15.08,34.17,18.18,2,19,3
24.99,-177.83,33.45,18.11,212.33,-46.56,34.14,18.2,2,20,3
24.99,-168.55,33.55,18.14,208.04,-85.42,34.13,18.24,2,21,3
24.99,-155.89,33.63,18.18,205.09,-96.09,34.13,18.3,2,22,3
30.01,-142.49,33.7,18.22,199.96,-97.28,34.13,18.41,2,23,3
43.88,-131.33,33.77,18.3,198.5,-97.23,34.14,18.53,2,24,3
46.36,-123.65,33.84,18.4,194.74,-96.18,34.15,18.66,2,25,3
53.11,-120.11,33.91,18.5,192.7,-93.85,34.16,18.82,2,26,3
53.84,-116.89,33.96,18.62,189.42,-89.96,34.14,18.99,2,27,3
67.36,-122.19,34.07,18.77,183.23,-85.96,34.12,19.16,2,28,3
