# Wildfire frequency and size in the U.S. 

#### Python tools

In [1]:
import pandas as pd
import altair as alt
import altair_stiles as altstiles

In [2]:
# Register the theme object exposed by altair_stiles under the name "stiles",
# then switch Altair's active theme to it. Registration has to come first:
# enable() looks the theme up by the name it was registered under.
alt.themes.register("stiles", altstiles.theme)
alt.themes.enable("stiles")

ThemeRegistry.enable('grid')

#### Get summary data from the National Interagency Fire Center

In [3]:
# pd.read_html returns a list of DataFrames, one per HTML table it parses from
# the page; [0] keeps the first one. Needs network access to nifc.gov.
# NOTE(review): assumes the yearly statistics table is the first table on the
# page -- confirm if the site layout changes.
src_df = pd.read_html('https://www.nifc.gov/fire-information/statistics/wildfires')[0]

#### Remove the non-data rows (text strings) at the top and bottom of the table

In [4]:
# Positional slice: drop the first three rows and the last row, then renumber
# the index from 0 (drop=True discards the old index instead of keeping it as
# a column).
# NOTE(review): the offsets 3 and -1 presumably match the header rows and the
# footer row of the scraped table -- re-check them if the source page changes.
src = src_df.iloc[3:-1].reset_index(drop=True)

#### Rename the columns

In [5]:
# Replace the scraped column labels with short names, assigned by position.
# pandas raises ValueError here if the frame does not have exactly three columns.
# NOTE(review): assumes the source columns are year, fire count and acreage,
# in that order -- verify against the page.
src.columns = ['year', 'fires', 'acres']

#### Clean up messy values and datatypes

In [6]:
# Strip every literal "*" and "," from the acreage strings in a single pass
# (character class instead of two chained literal replacements).
src['acres'] = src['acres'].str.replace(r'[*,]', '', regex=True)

In [7]:
# Cast the two numeric columns to int via a per-column dtype mapping; 'year'
# is left as it is. Fails with ValueError if any value is still not a clean
# integer string.
src = src.astype({'fires': int, 'acres': int})

#### Clean dataframe, sorted by year

In [8]:
# Working frame: rows in ascending 'year' order, detached from `src`.
# The original index labels are kept (no reset after sorting).
df = src.sort_values(by='year', ascending=True).copy()

---

#### Acres per fire

In [9]:
# Acres burned divided by number of fires for each row, rounded to a whole
# number (the result stays a float column).
df['acres_per_fire'] = df['acres'].div(df['fires']).round()

#### Five-year rolling average of acres per fire

In [10]:
# Trailing mean over the current row and the four before it. A full window of
# five observations is required, so the first four rows come out as NaN.
df['acres_per_fire_rolling'] = df['acres_per_fire'].rolling(5, min_periods=5).mean()

#### Chart it

In [11]:
# Line chart of the rolling acres-per-fire series. The ":T" suffix marks
# 'year' as a temporal field; the y field has no explicit type, so Altair
# infers it from the dataframe column.
alt.Chart(df).mark_line().encode(
    x=alt.X('year:T'),
    y=alt.Y('acres_per_fire_rolling'),
)

#### Export

In [12]:
# Write the whole working frame (year, fires, acres and the two derived
# columns) to CSV; index=False leaves the dataframe index out of the file.
# NOTE(review): the path is relative to the notebook's working directory and
# pandas does not create missing folders -- data/processed/ must already exist.
df.to_csv('data/processed/usa_wildfires_years_acres_average.csv', index=False)