In [1]:
import polars as pl
import pandas as pd
import numpy as np
import math as math
# find a better way to import?
import sys
import os
sys.path.append(os.path.join(os.path.dirname(''), '..'))

from constants import *


In [2]:
# Load the raw competition tables from the sibling data directory.
# A larger infer_schema_length makes polars scan more rows before fixing each
# column's dtype.
players = pl.read_csv('../nfl-big-data-bowl-2024/players.csv')
plays = pl.read_csv(
    '../nfl-big-data-bowl-2024/plays.csv',
    infer_schema_length=100000,
)
games = pl.read_csv(
    '../nfl-big-data-bowl-2024/games.csv',
    infer_schema_length=10000,
)
# The `*` wildcard is expected to pick up every weekly tracking file.
tracking = pl.read_csv(
    '../nfl-big-data-bowl-2024/tracking_week*.csv',
    infer_schema_length=10000,
)

In [3]:
# Normalize identifiers.
# nflId is cast to a string in `players` (it is later used as a join key
# against the tracking data).
players = players.with_columns(pl.col('nflId').cast(str))

# "<gameId>-<playId>" identifies a play across all games.
_play_key = pl.col('gameId').cast(str) + '-' + pl.col('playId').cast(str)

# Attach game-level columns to every play, then add the play key.
plays = (
    plays
    .join(games, on='gameId')
    .with_columns(_play_key.alias('uniquePlayId'))
)

# Tracking rows get the same play key plus a per-player-per-play key
# "<gameId>-<playId>-<nflId>".
tracking = tracking.with_columns(
    _play_key.alias('uniquePlayId'),
    (_play_key + '-' + pl.col('nflId').cast(str)).alias('uniquePlayerId'),
)

# Normalize position into a play-direction-independent frame.
# The raw axes are swapped: adjustedX is derived from raw `y` and adjustedY
# from raw `x`.  Plays going 'right' mirror the y axis; all other plays mirror
# the x axis instead.
# presumably 53.3 and 120 are the field width and length in yards — TODO confirm
_moving_right = pl.col('playDirection') == 'right'
tracking = tracking.with_columns(
    pl.when(_moving_right)
    .then(53.3 - pl.col('y'))
    .otherwise(pl.col('y'))
    .alias('adjustedX'),
    pl.when(_moving_right)
    .then(pl.col('x'))
    .otherwise(120 - pl.col('x'))
    .alias('adjustedY'),
)

# Frame number of the 'ball_snap' event for each play.  Rows that are not the
# snap contribute -1, so the per-play maximum is the snap frame, or -1 when
# the play has no 'ball_snap' row at all.
_snap_frame_or_sentinel = (
    pl.when(pl.col('event') == 'ball_snap')
    .then(pl.col('frameId'))
    .otherwise(-1)
)
tracking = tracking.with_columns(
    _snap_frame_or_sentinel.max().over('uniquePlayId').alias('startingFrameId')
)

# Signed frame offset from the snap: negative before, 0 at, positive after.
# NOTE(review): for a play without a 'ball_snap' row this becomes frameId + 1.
tracking = tracking.with_columns(
    (pl.col('frameId') - pl.col('startingFrameId')).alias('framesSinceSnap')
)

# normalize orientation 'o' and direction 'dir'
# Cells holding the text 'NA' are swapped for '0' so that the later cast to
# Float64 succeeds.
# assumes 'o' and 'dir' were read as string columns — TODO confirm
replacement_values = {'NA': '0'}


def _replace_exact(column_name, mapping):
    """Build an expression that swaps exact matches in a column.

    Args:
        column_name: name of the column to rewrite.
        mapping: dict of {old value: new value}; any value not listed (and any
            null) passes through unchanged.

    Returns:
        A polars expression aliased back to `column_name`.
    """
    replaced = pl.col(column_name)
    for old_value, new_value in mapping.items():
        replaced = (
            pl.when(pl.col(column_name) == old_value)
            .then(pl.lit(new_value))
            .otherwise(replaced)
        )
    return replaced.alias(column_name)


# Native expressions run inside polars instead of calling a Python lambda once
# per row of the tracking table.
tracking = tracking.with_columns(
    _replace_exact('o', replacement_values),
    _replace_exact('dir', replacement_values),
)

# Re-express direction and orientation relative to the play direction.
_moving_right = pl.col('playDirection') == 'right'
_dir_degrees = pl.col('dir').cast(pl.Float64)
_o_degrees = pl.col('o').cast(pl.Float64)

# Plays going 'right' keep the raw angles.  Otherwise `dir` is reflected
# (180 - dir) and `o` is rotated half a turn, wrapped into [0, 360).
# NOTE(review): adjustedDir is not wrapped, so it can be negative, and it does
# not receive the second step applied to the orientation below — confirm this
# is intended.
tracking = tracking.with_columns(
    pl.when(_moving_right)
    .then(_dir_degrees)
    .otherwise(180 - _dir_degrees)
    .alias('adjustedDir'),
    pl.when(_moving_right)
    .then(_o_degrees)
    .otherwise((180 + _o_degrees) % 360)
    .alias('firstAdjustedO'),
)

# Second step for orientation: 180 - angle, with 360 added back when that
# would be negative (i.e. 540 - angle for angles above 180).
_first_pass_o = pl.col('firstAdjustedO')
tracking = tracking.with_columns(
    pl.when(_first_pass_o <= 180)
    .then(180 - _first_pass_o)
    .otherwise(540 - _first_pass_o)
    .alias('adjustedO')
)

In [5]:
# Default full width of a player's vision cone (default `cone_angle` of
# is_in_vision_cone).
CONE_ANGLE = 120 # degrees
# Largest separation at which is_in_distance still reports True.
MAX_DISTANCE = 3 # yards
# Largest separation at which is_blocking still reports True.
BLOCKING_RADIUS = 1.25 # yards

def angle_in_range(angle, left_boundary, right_boundary):
    """Tell whether `angle` lies on the arc running from the left to the right boundary.

    All values are in degrees.  The arc starts at `left_boundary` and sweeps
    through increasing angles (modulo 360) up to `right_boundary`; both ends
    are inclusive, and arcs that cross 0/360 are handled.

    Returns:
        True when `angle` is on the arc, otherwise False.
    """
    arc_width = (right_boundary - left_boundary) % 360
    offset_from_left = (angle - left_boundary) % 360
    return offset_from_left <= arc_width

# Row-wise variant for DataFrame.apply.
# row = [o, dir, x, y] of the first player followed by the same four values
# for the second player (the notebook passes the adjusted* columns).
def looking_to_block_or_blocking_df_fn(row) -> int:
    """Score one player pairing from a flat row.

    Returns:
        0 when the second player is outside the first player's vision cone,
        1 when inside the cone,
        2 when inside the cone and also within blocking range.
    """
    first_player, second_player = row[0:4], row[4:]

    in_cone = is_in_vision_cone(first_player, second_player)
    in_contact = is_blocking(first_player, second_player)

    if not in_cone:
        return 0
    return 2 if in_contact else 1
    

def looking_to_block_or_blocking(player1: tuple, player2: tuple) -> int:
    """Score how engaged `player1` is with `player2`.

    Args:
        player1: (orientation, direction, x, y) of the potential blocker.
        player2: (orientation, direction, x, y) of the other player.

    Returns:
        0 when `player2` is outside `player1`'s vision cone,
        1 when inside the cone,
        2 when inside the cone and also within blocking range.
    """
    if not is_in_vision_cone(player1, player2):
        return 0

    # Return the computed status; a hard-coded 0 here would discard it.
    return 2 if is_blocking(player1, player2) else 1

def is_in_vision_cone(player1: tuple, player2: tuple, cone_angle=CONE_ANGLE) -> bool:
    """Check that `player2` is both inside `player1`'s cone and close enough.

    Args:
        player1: (orientation, direction, x, y) of the observer.
        player2: (orientation, direction, x, y) of the observed player.
        cone_angle: full cone width in degrees; defaults to CONE_ANGLE.

    Returns:
        True only when the angular test and the distance test both pass.
    """
    if not is_in_angle(player1, player2, cone_angle):
        return False
    return is_in_distance(player1, player2)

def is_in_angle(player1: tuple, player2: tuple, cone_angle) -> bool:
    """Check whether `player2` lies inside `player1`'s angular cone.

    The bearing from `player1` to `player2` is atan2(dy, dx) converted to
    degrees in [0, 360), using index 2 as x and index 3 as y.  The cone is
    centred on `player1`'s orientation (index 0) and spans `cone_angle`
    degrees in total.
    # assumes the orientation uses the same angular convention as that
    # bearing — TODO confirm against the normalization step

    Args:
        player1: (orientation, direction, x, y); orientation may be a numeric
            string, which is converted to float.
        player2: (orientation, direction, x, y); only x and y are read.
        cone_angle: full cone width in degrees.

    Returns:
        True when the bearing falls within the cone (boundaries inclusive).
    """
    # A cone of a full turn or more covers every bearing.  Without this guard
    # the two boundaries coincide modulo 360 and the arc collapses to zero width.
    if cone_angle >= 360:
        return True

    half_cone_angle = cone_angle / 2

    y_dist = player2[3] - player1[3]
    x_dist = player2[2] - player1[2]

    player1_orientation = player1[0]
    # isinstance also accepts str subclasses, which an exact type check rejects.
    if isinstance(player1_orientation, str):
        player1_orientation = float(player1_orientation)

    # Bearing from player1 to player2, shifted from (-180, 180] into [0, 360).
    angle = math.degrees(math.atan2(y_dist, x_dist))
    angle = (angle + 360) % 360

    left_vision_boundary = (360 + player1_orientation - half_cone_angle) % 360
    right_vision_boundary = (player1_orientation + half_cone_angle) % 360

    return bool(angle_in_range(angle, left_vision_boundary, right_vision_boundary))

def is_in_distance(player1: tuple, player2: tuple) -> bool:
    """Report whether the two players are at most MAX_DISTANCE apart.

    Returns:
        True when the distance is less than or equal to MAX_DISTANCE.
    """
    return calculate_distance(player1, player2) <= MAX_DISTANCE

def is_blocking(player1: tuple, player2: tuple) -> bool:
    """Report whether the two players are at most BLOCKING_RADIUS apart.

    Returns:
        True when the distance is less than or equal to BLOCKING_RADIUS.
    """
    return calculate_distance(player1, player2) <= BLOCKING_RADIUS


def calculate_distance(player1: tuple, player2: tuple) -> float:
    """Euclidean distance between two players.

    Index 2 of each player is read as x and index 3 as y.

    Returns:
        The straight-line distance as a float.
    """
    # Squaring discards the sign, so the deltas need no abs().
    delta_x = player1[2] - player2[2]
    delta_y = player1[3] - player2[3]
    return math.sqrt(delta_x**2 + delta_y**2)

In [14]:
# copy.copy is used by type_of_block_df_fn to hand every classifier its own
# copy of the second player's row, so the original list is never modified.
import copy
# Cone width, in degrees, that is_left_vision_cone and is_right_vision_cone
# pass to is_in_angle.
SIDE_CONE_ANGLES = 150

# Block location labels returned by type_of_block_df_fn:
#   "none"  => none of the checks matched
#   "left"  => box
#   "dent"  => dent
#   "right" => spill
def type_of_block_df_fn(row) -> str:
    """Label one player pairing from a flat row.

    The first four values of `row` describe player 1 and everything after
    them describes player 2.  Checks run in the order dent, left, right and
    the first one that passes decides the label.

    NOTE(review): when the row carries a trailing blockType value it ends up
    at the tail of the player-2 list and is never read here, so a pairing with
    blockType 0 can still get a location label — confirm this is intended.

    Returns:
        "dent", "left", "right", or "none".
    """
    player1 = list(row[0:4])
    player2 = list(row[4:])

    labelled_checks = (
        ("dent", is_dent),
        ("left", is_left_vision_cone),
        ("right", is_right_vision_cone),
    )
    for label, check in labelled_checks:
        # Each check gets a fresh copy so any in-place change it makes to the
        # second player's row cannot leak into the next check.
        if check(player1, copy.copy(player2)):
            return label

    return "none"

def is_left_vision_cone(player1: tuple, player2: tuple) -> bool:
    """Check whether `player1` lies in `player2`'s cone after turning it +90 degrees.

    `player2`'s orientation (index 0) is advanced by 90 degrees, wrapped into
    [0, 360), and `player1` is then tested against a cone of SIDE_CONE_ANGLES
    degrees around that rotated orientation.

    Args:
        player1: (orientation, direction, x, y) of the player being looked for.
        player2: (orientation, direction, x, y) of the observer; any sequence
            is accepted and it is left unmodified.

    Returns:
        True when `player1` falls inside the rotated cone.
    """
    # Rotate a private copy: writing into the argument would change the
    # caller's data and would fail outright for tuples.
    rotated_observer = list(player2)
    rotated_observer[0] = (player2[0] + 90) % 360
    return is_in_angle(rotated_observer, player1, SIDE_CONE_ANGLES)

# Dent: each player has the other inside a narrow vision cone.
def is_dent(player1: tuple, player2: tuple) -> bool:
    """Check that both players see each other within a 50-degree cone.

    Returns:
        True only when `player2` is in `player1`'s cone and `player1` is in
        `player2`'s cone.
    """
    mutual_cone_angle = 50
    if not is_in_vision_cone(player1, player2, mutual_cone_angle):
        return False
    return is_in_vision_cone(player2, player1, mutual_cone_angle)

def is_right_vision_cone(player1: tuple, player2: tuple) -> bool:
    """Check whether `player1` lies in `player2`'s cone after turning it -90 degrees.

    `player2`'s orientation (index 0) is moved back by 90 degrees, wrapped
    into [0, 360), and `player1` is then tested against a cone of
    SIDE_CONE_ANGLES degrees around that rotated orientation.

    Args:
        player1: (orientation, direction, x, y) of the player being looked for.
        player2: (orientation, direction, x, y) of the observer; any sequence
            is accepted and it is left unmodified.

    Returns:
        True when `player1` falls inside the rotated cone.
    """
    # Rotate a private copy: writing into the argument would change the
    # caller's data and would fail outright for tuples.
    rotated_observer = list(player2)
    rotated_observer[0] = (player2[0] - 90) % 360
    return is_in_angle(rotated_observer, player1, SIDE_CONE_ANGLES)
    

In [7]:
# Game, play and jersey pair used for inspection in the cells below.
# Jersey numbers are strings because they are compared against string columns.
GAME_ID = 2022091500
PLAY_ID = 55
JERSEY_NUMBER = '62'
JERSEY_NUMBER_DEFENDER = '97'

# Tracking rows of the selected game only.
labeled = tracking.filter(pl.col('gameId') == GAME_ID)

# NOTE(review): `players` is rebound from the roster table to the enriched
# tracking frame, so this cell cannot simply be re-run without reloading the
# roster first.
_team_abbreviations = games.select(['gameId', 'homeTeamAbbr', 'visitorTeamAbbr'])
players = (
    labeled
    .join(players, on='nflId', how='left')
    .join(_team_abbreviations, on='gameId')
    .with_columns(
        # The home club's opponent is the visitor; every other club value
        # gets the home team as its opponent.
        pl.when(pl.col('club') == pl.col('homeTeamAbbr'))
        .then(pl.col('visitorTeamAbbr'))
        .otherwise(pl.col('homeTeamAbbr'))
        .alias('opponentClub')
    )
)


In [8]:
# Self-join: pair every row with each row of the same game, play and frame
# whose opponentClub equals this row's club.  Columns from the right-hand
# side that clash with existing names get the 'Defender' suffix.
_frame_keys = ['gameId', 'playId', 'frameId']
players = players.join(
    players,
    left_on=_frame_keys + ['club'],
    right_on=_frame_keys + ['opponentClub'],
    suffix='Defender',
)

In [9]:
# Score every player/opponent pairing row by row; the resulting 0/1/2 status
# is stored in the `blockType` column.
_pair_feature_columns = [
    'adjustedO', 'adjustedDir', 'adjustedX', 'adjustedY',
    'adjustedODefender', 'adjustedDirDefender', 'adjustedXDefender', 'adjustedYDefender',
]
blocking_df = (
    players
    .select(_pair_feature_columns)
    .apply(looking_to_block_or_blocking_df_fn)
    .to_series()
)
players = players.with_columns(blockType=blocking_df)

In [10]:
# Narrow the pairings down to the single play under inspection.
# (Further filters on jersey number or frame can be chained here when
# debugging one matchup.)
test_data = players.filter(
    (pl.col('gameId') == GAME_ID) & (pl.col('playId') == PLAY_ID)
)

# Score the play's pairings again and overwrite `blockType` with the result.
_pair_feature_columns = [
    'adjustedO', 'adjustedDir', 'adjustedX', 'adjustedY',
    'adjustedODefender', 'adjustedDirDefender', 'adjustedXDefender', 'adjustedYDefender',
]
is_blocking_df = (
    test_data
    .select(_pair_feature_columns)
    .apply(looking_to_block_or_blocking_df_fn)
    .to_series()
)
test_data = test_data.with_columns(blockType=is_blocking_df)

In [11]:
# Label each pairing of the play with a block location.  The row handed to
# type_of_block_df_fn carries the eight pair features followed by blockType.
_block_location_inputs = test_data.select([
    'adjustedO', 'adjustedDir', 'adjustedX', 'adjustedY',
    'adjustedODefender', 'adjustedDirDefender', 'adjustedXDefender', 'adjustedYDefender',
    'blockType',
])
type_of_block_df = _block_location_inputs.apply(type_of_block_df_fn)

test_data = test_data.with_columns(blockLocation=type_of_block_df.to_series())

In [20]:
%config IPCompleter.greedy=True
%config IPCompleter.display_limit=500 
%config Polars.Lazy.frame_repr.max_elements=500  # Replace 10 with the desired number of rows


test_blocking = test_data.filter(pl.col('jerseyNumber')==JERSEY_NUMBER).filter(pl.col('jerseyNumberDefender')==JERSEY_NUMBER_DEFENDER)
test_blocking.select(
    'adjustedO', 'adjustedDir', 'adjustedX', 'adjustedY', 'adjustedODefender', 
    'adjustedDirDefender', 'adjustedXDefender', 'adjustedYDefender', 'blockType',
    'framesSinceSnap', 'blockLocation'
).filter(pl.col('framesSinceSnap') >= 6).filter(pl.col('framesSinceSnap')>=

adjustedO,adjustedDir,adjustedX,adjustedY,adjustedODefender,adjustedDirDefender,adjustedXDefender,adjustedYDefender,blockType,framesSinceSnap,blockLocation
f64,f64,f64,f64,f64,f64,f64,f64,i64,i64,str
80.08,-32.54,28.07,33.8,245.97,81.62,35.0,35.35,0,-5,"""right"""
81.64,-43.62,28.08,33.8,245.97,100.92,35.01,35.35,0,-4,"""right"""
83.13,-43.7,28.08,33.8,247.56,110.45,35.02,35.34,0,-3,"""right"""
83.13,-47.95,28.08,33.8,247.56,126.32,35.04,35.34,0,-2,"""right"""
83.13,-57.33,28.09,33.8,247.56,130.24,35.04,35.34,0,-1,"""right"""
83.13,-164.93,28.11,33.79,246.7,121.34,35.05,35.32,0,0,"""right"""
82.33,178.18,28.12,33.79,245.93,106.78,35.05,35.3,0,1,"""right"""
81.52,173.78,28.13,33.78,244.84,95.22,35.05,35.28,0,2,"""right"""
80.11,164.91,28.16,33.77,245.72,88.76,35.05,35.23,0,3,"""right"""
78.45,168.12,28.2,33.77,241.88,86.25,35.05,35.16,0,4,"""right"""
