In [7]:
import pandas as pd

# Read the cleaned metadata and parse the decision dates in one chained step.
# errors='coerce' turns any value that cannot be parsed into NaT instead of
# raising, so downstream code must be prepared for missing dates.
df_core = pd.read_csv("cleaned_legal_metadata.csv").assign(
    decision_date=lambda frame: pd.to_datetime(
        frame['decision_date'], errors='coerce'
    )
)

# Template-based draft generator
def generate_baseline_draft(row):
    """Build a one-sentence baseline draft describing a single filing.

    Args:
        row: A mapping-like record (for example a DataFrame row) providing
            the keys 'name_abbreviation', 'court/name_abbreviation',
            'decision_date' and 'docket_number'. A non-null
            'decision_date' must expose ``strftime``.

    Returns:
        str: A sentence of the form
        "<title>, filed in the <court> on <date>, under docket number
        <docket>." Every missing field (None, NaN or NaT) is replaced by a
        readable placeholder rather than being rendered as "nan"/"None".
    """

    def _or_placeholder(value, placeholder):
        # pd.notnull is False for None, NaN and NaT alike, so one check
        # covers every way a CSV cell can come back empty.
        return value if pd.notnull(value) else placeholder

    title = _or_placeholder(row['name_abbreviation'], "Unknown case")
    court = _or_placeholder(row['court/name_abbreviation'], "unknown court")
    docket = _or_placeholder(row['docket_number'], "unknown")

    decided = row['decision_date']
    # NOTE: %B yields the month name for the current locale.
    date = (
        decided.strftime('%B %d, %Y')
        if pd.notnull(decided)
        else "an unknown date"
    )

    return f"{title}, filed in the {court} on {date}, under docket number {docket}."

# Generate one draft per row (axis="columns" hands each row to the function)
# and store the results in a new 'baseline_draft' column.
df_core['baseline_draft'] = df_core.apply(
    func=generate_baseline_draft,
    axis="columns",
)

# Preview the first rows: case name next to its generated draft.
print(df_core.head()[['name_abbreviation', 'baseline_draft']])

# Optional: persist the augmented table without the index column.
df_core.to_csv(path_or_buf="baseline_drafted_filings_v2.csv", index=False)



                                   name_abbreviation  \
0                              Olsen v. Nelnet, Inc.   
1  Am. Ctr. for Law & Justice v. U.S. Dep't of Ju...   
2                             United States v. Emery   
3                          Stearney v. United States   
4          In re German Auto. Mfrs. Antitrust Litig.   

                                      baseline_draft  
0  Olsen v. Nelnet, Inc., filed in the D. Neb. on...  
1  Am. Ctr. for Law & Justice v. U.S. Dep't of Ju...  
2  United States v. Emery, filed in the D. S.D. o...  
3  Stearney v. United States, filed in the D. Ari...  
4  In re German Auto. Mfrs. Antitrust Litig., fil...  
