In [1]:
import requests
import pandas as pd

# Endpoint: data.cdc.gov dataset queried throughout this notebook.
DEMAND_URL = "https://data.cdc.gov/resource/vjzj-u7u8.json"

# requests applies no timeout by default, so an unresponsive server would
# block the kernel indefinitely; cap the wait (seconds).
REQUEST_TIMEOUT = 30

# Pull a small sample: "$limit" caps the number of rows returned.
demand_response = requests.get(
    DEMAND_URL,
    params={"$limit": 100},
    timeout=REQUEST_TIMEOUT,
)
# Fail here on an HTTP error instead of building a DataFrame from an
# error payload and hitting a confusing failure further down.
demand_response.raise_for_status()

# Convert to a DataFrame (one row per JSON record).
# NOTE: the recorded output shows every column arriving as object dtype,
# including `date` and `percent_visits` — convert before numeric/date work.
demand_df = pd.DataFrame(demand_response.json())

# Explore
print("=== DEMAND DATA ===")
# DataFrame.info() writes its report to stdout and returns None, so wrapping
# it in print() appended a stray "None" line to the output.
demand_df.info()
print(demand_df.head())



=== DEMAND DATA ===
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 100 entries, 0 to 99
Data columns (total 4 columns):
 #   Column          Non-Null Count  Dtype 
---  ------          --------------  ----- 
 0   date            100 non-null    object
 1   pathogen        100 non-null    object
 2   geography       100 non-null    object
 3   percent_visits  100 non-null    object
dtypes: object(4)
memory usage: 3.3+ KB
None
                      date pathogen geography percent_visits
0  2022-09-25T00:00:00.000      ARI   Alabama          15.99
1  2022-09-26T00:00:00.000      ARI   Alabama          14.33
2  2022-09-27T00:00:00.000      ARI   Alabama          15.16
3  2022-09-28T00:00:00.000      ARI   Alabama          13.78
4  2022-09-29T00:00:00.000      ARI   Alabama           13.7


In [6]:
# Summarise the 100-row sample held in `demand_df`: which geographies and
# pathogens it contains, and the span of dates it covers.

print("=== GEOGRAPHY VALUES ===")
sample_geographies = demand_df["geography"].unique()
print(sample_geographies)

print("\n=== PATHOGEN VALUES ===")
sample_pathogens = demand_df["pathogen"].unique()
print(sample_pathogens)

print("\n=== DATE RANGE ===")
# min()/max() run on the `date` column exactly as loaded.
date_column = demand_df["date"]
earliest_date = date_column.min()
latest_date = date_column.max()
print(earliest_date, "to", latest_date)

=== GEOGRAPHY VALUES ===
['Alabama']

=== PATHOGEN VALUES ===
['ARI']

=== DATE RANGE ===
2022-09-25T00:00:00.000 to 2023-01-02T00:00:00.000


In [7]:
def query_demand(select_clause, timeout=30):
    """Send a ``$select`` query to DEMAND_URL and return the checked response.

    Parameters
    ----------
    select_clause : str
        Value passed as the ``$select`` query parameter
        (e.g. ``"DISTINCT pathogen"``).
    timeout : float, optional
        Seconds to wait for the server; requests has no default timeout,
        so without this a stalled connection would hang the kernel.

    Returns
    -------
    requests.Response
        The response, guaranteed to carry a non-error HTTP status.

    Raises
    ------
    requests.HTTPError
        If the server answers with a 4xx/5xx status. Raising here avoids
        iterating an error payload as if it were a list of rows.
    """
    response = requests.get(
        DEMAND_URL,
        params={"$select": select_clause},
        timeout=timeout,
    )
    response.raise_for_status()
    return response


# Check all pathogens
demand_full = query_demand("DISTINCT pathogen")
print("PATHOGENS:", [r['pathogen'] for r in demand_full.json()])

# Check all geographies
demand_geo = query_demand("DISTINCT geography")
print("GEOGRAPHIES:", [r['geography'] for r in demand_geo.json()])

# Check date range (server-side aggregate over the whole dataset,
# not just the 100-row sample)
demand_dates = query_demand("MIN(date) as min_date, MAX(date) as max_date")
print("DATE RANGE:", demand_dates.json())

PATHOGENS: ['COVID', 'RSV', 'Influenza', 'ARI']
GEOGRAPHIES: ['Kansas', 'Texas', 'Oregon', 'Idaho', 'Alaska', 'Alabama', 'United States', 'Oklahoma', 'North Carolina', 'Colorado', 'Mississippi', 'Florida', 'Vermont', 'Delaware', 'Nevada', 'Louisiana', 'New York', 'West Virginia', 'South Carolina', 'New Jersey', 'New Mexico', 'Hawaii', 'Arkansas', 'Connecticut', 'South Dakota', 'District of Columbia', 'Iowa', 'Indiana', 'Massachusetts', 'Rhode Island', 'Ohio', 'Michigan', 'Minnesota', 'Pennsylvania', 'Washington', 'Wisconsin', 'Montana', 'Kentucky', 'Arizona', 'Illinois', 'Virginia', 'Maryland', 'Georgia', 'Utah', 'Wyoming', 'New Hampshire', 'North Dakota', 'Nebraska', 'Maine', 'California', 'Tennessee']
DATE RANGE: [{'min_date': '2022-09-25T00:00:00.000', 'max_date': '2025-12-13T00:00:00.000'}]
