# Analyzing Barstool Sports post metadata

#### Python tools and notebook settings

In [1]:
%load_ext lab_black

In [2]:
import datetime as dt
import os

import altair as alt
import altair_stiles as altstiles
import pandas as pd

In [3]:
# Register the theme object from altair_stiles under the name "stiles",
# then make that name the active Altair theme.
# NOTE(review): the saved output for this cell shows ThemeRegistry.enable('grid'),
# not 'stiles' — the output may be stale; confirm which theme is in effect.
alt.themes.register("stiles", altstiles.theme)
alt.themes.enable("stiles")

ThemeRegistry.enable('grid')

In [4]:
# Display limits for DataFrame output: up to 100 columns and 1000 rows,
# with no truncation of cell text.
pd.set_option("display.max_columns", 100)
pd.set_option("display.max_rows", 1000)
pd.set_option("display.max_colwidth", None)

In [29]:
# Current local date as a YYYY-MM-DD string.
today = f"{dt.date.today():%Y-%m-%d}"

---

In [30]:
# Location of the source CSV. Defaults to the original local path; set the
# BARSTOOL_CSV environment variable to run the notebook on another machine.
DATA_PATH = os.environ.get("BARSTOOL_CSV", "/Users/stiles/data/barstool.csv")

# Parse the three date-like columns while reading and keep the id column
# as strings rather than letting pandas infer a numeric dtype.
src_df = pd.read_csv(
    DATA_PATH,
    parse_dates=["week_start", "published_date", "timestamp"],
    dtype={"id": str},
)

In [31]:
# Number of rows loaded from the CSV.
src_df.shape[0]

220809

#### Parse dates for aggregates

In [32]:
# Derive calendar fields from published_date for aggregates.
# Written as one chained expression with no inplace mutation so the cell can
# be re-run safely: an inplace drop raises KeyError on a second run because
# the columns are already gone.
src_df = src_df.assign(
    year=src_df["published_date"].dt.year,
    month=src_df["published_date"].dt.month,
    # First day of each row's publication month as a datetime. Computed
    # directly from the datetime column instead of building "Y-M-01" strings
    # and re-parsing them; a missing published_date yields NaT.
    month_year=src_df["published_date"].dt.to_period("M").dt.to_timestamp(),
).drop(
    columns=["timestamp", "week_start"],
    errors="ignore",  # tolerate re-runs after the columns were removed
)

In [33]:
# Work on an independent (deep) copy so src_df keeps the loaded data.
df = src_df.copy(deep=True)

In [34]:
# Show rows whose title contains "Rundown"; missing titles are treated as
# empty strings so they never match.
df.loc[df["title"].fillna("").str.contains("Rundown")]

Unnamed: 0,id,type,title,author_name,comment_count,brand_name,branch_url,img_url,tags,published_date,published_hour,published_day,first_tag,category_name,year,month,month_year
145,3431374,barstool_original,"Tommy's Office Hookup Brings The Roof Down | Barstool Rundown September 1, 2022",Michael Angelo,14,Barstool Rundown,https://bars.tl/3431374,https://chumley.barstoolsports.com/union/2022/09/01/9.1-THUMBNAIL.8532d31d.jpeg?crop=4%3A3%2Csmart&width=560,[],2022-09-01,18,Thursday,,Boston,2022,9,2022-09-01
237,3431129,barstool_original,"The New Winnie The Pooh Movie Is Nightmare Fuel - Barstool Rundown - August 31, 2022",Michael Angelo,4,Barstool Rundown,https://bars.tl/3431129,https://chumley.barstoolsports.com/union/2022/08/31/THUMB-8.31.22336043.jpeg?crop=4%3A3%2Csmart&width=560,"['rundown', 'the-rundown', 'winnie-the-pooh', 'hilary-duff', 'mlb', 'barstool-chicago']",2022-08-31,18,Wednesday,rundown,Boston,2022,8,2022-08-01
309,3430904,barstool_original,"Jersey Jerry Reflects On Pooping Pants - Barstool Rundown - August 30, 2022",Michael Angelo,6,Barstool Rundown,https://bars.tl/3430904,https://chumley.barstoolsports.com/union/2022/08/30/8.30-THUMB.5ef9b1bd.jpeg?crop=4%3A3%2Csmart&width=560,[],2022-08-30,18,Tuesday,,Boston,2022,8,2022-08-01
385,3430692,barstool_original,"Is Yung Gravy Dating Addison Rae's Mom? - Barstool Rundown - August 29, 2022",Michael Angelo,8,Barstool Rundown,https://bars.tl/3430692,https://chumley.barstoolsports.com/union/2022/08/29/8.29-THUMB.f8cc43f9.jpeg?crop=4%3A3%2Csmart&width=560,"['sports', 'nfl', 'el-presidente', 'college-football', 'nebraska', 's', 'aaron-rodger', 'aaron-donald', 'cleveland-browns', 'sydney-sweeney', 'yung-gravy']",2022-08-29,18,Monday,sports,Boston,2022,8,2022-08-01
571,3430222,barstool_original,"Week 0 of CFB Is Here - Barstool Rundown - August 25, 2022",Michael Angelo,5,Barstool Rundown,https://bars.tl/3430222,https://chumley.barstoolsports.com/union/2022/08/25/THUMBNAIL-8.25-Large.193338f6.jpeg?canvas=4%3A3&bg-color=000000&width=560,"['sports', 'college', 'el-presidente', 'chicago', 'week-0', 'monkey-pox', 'len-dawson']",2022-08-25,18,Thursday,sports,Boston,2022,8,2022-08-01
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
206200,189223,standard_post,Barstool Rundown - March 31,hubbs,0,,,https://chumley.barstoolsports.com/union/getty/2022/07/25/GettyImages-1410364892.c004d22e.jpeg?crop=4%3A3%2Csmart&width=560,[],2014-03-31,19,Monday,,BarstoolU,2014,3,2014-03-01
206256,1080450,barstool_original,Gronk On The Rundown,Dante,0,Barstool Originals,https://bars.tl/eM8lAoDCZP,https://chumley.barstoolsports.com/union/getty/2022/07/23/GettyImages-1217774756.8669e696.jpeg?crop=4%3A3%2Csmart&width=560,"['gold', 'throwback', 'barstool gold']",2014-03-30,10,Sunday,gold,Chicago,2014,3,2014-03-01
206319,188695,standard_post,Barstool Rundown - March 27th,Ohios Tate,0,,,https://chumley.barstoolsports.com/union/2022/07/21/bdc.58cbe6ea.jpg?crop=0.66%2C0.33%2Cx0.12%2Cy0.67%2Csafe&width=560,[],2014-03-27,20,Thursday,,Boston,2014,3,2014-03-01
206371,86889,standard_post,Barstool Sports Internet Rundown March 26th,Jersey Jerry,0,,,https://chumley.barstoolsports.com/union/getty/2021/05/03/GettyImages-1307507053.466a7f47.jpeg?crop=4%3A3%2Csmart&width=560,[],2014-03-26,22,Wednesday,,New York,2014,3,2014-03-01
