# Jupyter Notebook: Parsing CSV file and Visualizing Data

In this notebook, we will load a CSV file, convert it to a pandas DataFrame, and then create a map visualizations using folium.

In [1]:
pip install pandas folium


[1m[[0m[34;49mnotice[0m[1;39;49m][0m[39;49m A new release of pip available: [0m[31;49m22.3.1[0m[39;49m -> [0m[32;49m24.2[0m
[1m[[0m[34;49mnotice[0m[1;39;49m][0m[39;49m To update, run: [0m[32;49mpip3 install --upgrade pip[0m
Note: you may need to restart the kernel to use updated packages.


In [2]:
# Import necessary libraries
import pandas as pd
import folium

## Step 1: Load CSV File

In [3]:
# Load the CSV file into a DataFrame
file_path = "colorado_product_manufacturers_full_list.csv"

df = pd.read_csv(file_path)

# Optional: Display the first few rows to check if the file is loaded correctly
df.head(15)

Unnamed: 0,License Number,Facility Name,DBA,Facility Type,Street,City,State,Zip Code,Date Updated,Latitude,Longitude
0,404-00341,2306 N POWERS LLC,Hightops,Medical Marijuana Products Mfg,"2306 North Powers Frontage Road, Suite 100",Colorado Springs,CO,80915,2024-09-03,38.863467,-104.720079
1,404-00538,81082 LLC,Colorado Cannabis Exchange II,Medical Marijuana Products Mfg,123 Pine Street,Trinidad,CO,81082,2024-09-03,37.173006,-104.509181
2,404-00650,ACES PLACE LLC,Green Rooster Concentrates,Medical Marijuana Products Mfg,14621 County Road 98,Nunn,CO,80648,2024-09-03,40.696002,-104.775428
3,404-00510,ADAMS GREEN CROSSING LLC,,Medical Marijuana Products Mfg,"2727 Palmer Park Boulevard, Suite A",Colorado Springs,CO,80909,2024-09-03,38.853439,-104.777734
4,404-00498,AF INC,Apothecary Extracts,Medical Marijuana Products Mfg,3049 Delta Drive,Colorado Springs,CO,80910,2024-09-03,38.79516,-104.77684
5,404-00629,AF INC,Apothecary Extracts,Medical Marijuana Products Mfg,65 Precision Drive,Pueblo West,CO,81007,2024-09-03,38.335082,-104.727394
6,404-00493,ALLGREENS LLC,,Medical Marijuana Products Mfg,1235 South Huron Street,Denver,CO,80223,2024-09-03,39.694207,-104.996932
7,404-00472,AVICENNA PRODUCTS LLC,High Tech Concentrates,Medical Marijuana Products Mfg,3950 North Grape Street,Denver,CO,80207,2024-09-03,39.772075,-104.92454
8,404-00454,AVICENNA PRODUCTS LLC,High Tech Concentrates,Medical Marijuana Products Mfg,1822 South Bannock Street,Denver,CO,80223,2024-09-03,39.683521,-104.989639
9,404-00621,AVICENNA PRODUCTS LLC,High Tech Concentrates,Medical Marijuana Products Mfg,35715 US Highway 40 Building D Unit 106,Evergreen,CO,80439,2024-09-03,39.741408,-105.431886


## Step 2: Clean and Prepare the Data

In [4]:
# Check column names and data types
df.info()

# Clean any missing latitude or longitude data
df.dropna(subset=['Longitude', 'Latitude'], inplace=True)

# Optional: Check for missing values in other important columns
df.isnull().sum()

# Optional: Display the first few rows of cleaned data
df.head(15)

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 431 entries, 0 to 430
Data columns (total 11 columns):
 #   Column          Non-Null Count  Dtype  
---  ------          --------------  -----  
 0   License Number  431 non-null    object 
 1   Facility Name   431 non-null    object 
 2   DBA             306 non-null    object 
 3   Facility Type   431 non-null    object 
 4   Street          431 non-null    object 
 5   City            431 non-null    object 
 6   State           431 non-null    object 
 7   Zip Code        431 non-null    int64  
 8   Date Updated    431 non-null    object 
 9   Latitude        431 non-null    float64
 10  Longitude       431 non-null    float64
dtypes: float64(2), int64(1), object(8)
memory usage: 37.2+ KB


Unnamed: 0,License Number,Facility Name,DBA,Facility Type,Street,City,State,Zip Code,Date Updated,Latitude,Longitude
0,404-00341,2306 N POWERS LLC,Hightops,Medical Marijuana Products Mfg,"2306 North Powers Frontage Road, Suite 100",Colorado Springs,CO,80915,2024-09-03,38.863467,-104.720079
1,404-00538,81082 LLC,Colorado Cannabis Exchange II,Medical Marijuana Products Mfg,123 Pine Street,Trinidad,CO,81082,2024-09-03,37.173006,-104.509181
2,404-00650,ACES PLACE LLC,Green Rooster Concentrates,Medical Marijuana Products Mfg,14621 County Road 98,Nunn,CO,80648,2024-09-03,40.696002,-104.775428
3,404-00510,ADAMS GREEN CROSSING LLC,,Medical Marijuana Products Mfg,"2727 Palmer Park Boulevard, Suite A",Colorado Springs,CO,80909,2024-09-03,38.853439,-104.777734
4,404-00498,AF INC,Apothecary Extracts,Medical Marijuana Products Mfg,3049 Delta Drive,Colorado Springs,CO,80910,2024-09-03,38.79516,-104.77684
5,404-00629,AF INC,Apothecary Extracts,Medical Marijuana Products Mfg,65 Precision Drive,Pueblo West,CO,81007,2024-09-03,38.335082,-104.727394
6,404-00493,ALLGREENS LLC,,Medical Marijuana Products Mfg,1235 South Huron Street,Denver,CO,80223,2024-09-03,39.694207,-104.996932
7,404-00472,AVICENNA PRODUCTS LLC,High Tech Concentrates,Medical Marijuana Products Mfg,3950 North Grape Street,Denver,CO,80207,2024-09-03,39.772075,-104.92454
8,404-00454,AVICENNA PRODUCTS LLC,High Tech Concentrates,Medical Marijuana Products Mfg,1822 South Bannock Street,Denver,CO,80223,2024-09-03,39.683521,-104.989639
9,404-00621,AVICENNA PRODUCTS LLC,High Tech Concentrates,Medical Marijuana Products Mfg,35715 US Highway 40 Building D Unit 106,Evergreen,CO,80439,2024-09-03,39.741408,-105.431886


## Step 3: Create a Searchable Map

In [5]:
# Initialize the map centered around Colorado
m = folium.Map(location=[39.5501, -105.7821], zoom_start=7)

# Add markers to the map for each food pantry
for idx, row in df.iterrows():
    popup_text = f"""
    <strong>{row['Facility Name']}</strong><br>
    <strong>{row['DBA']}</strong><br>
    Facility Type: {row['Facility Type']}<br>
    {row['Street']}<br>
    {row['City']}, {row['State']} {row['Zip Code']}
    """
    folium.Marker(
        location=[row['Latitude'], row['Longitude']],
        popup=popup_text, icon=folium.Icon(icon="cloud",color="green")
    ).add_to(m)

# Save the map as an HTML file
m.save("colorado_product_manufacturers_full_list_map.html")

# Display the map in the notebook
m

## Step 4: Implement Search Functionality

In [6]:
# Example: Search for product manufacturers in a specific city
city_search = "Denver"  # Replace with user input

# Filter the DataFrame based on the city
filtered_df = df[df['City'].str.contains(city_search, case=False, na=False)]

# Create a map for the filtered results
m_filtered = folium.Map(location=[39.5501, -105.7821], zoom_start=7)

for idx, row in filtered_df.iterrows():
    popup_text = f"""
    <strong>{row['Facility Name']}</strong><br>
    <strong>{row['DBA']}</strong><br>
    Facility Type: {row['Facility Type']}<br>
    {row['Street']}<br>
    {row['City']}, {row['State']} {row['Zip Code']}
    """
    folium.Marker(
        location=[row['Latitude'], row['Longitude']],
        popup=popup_text, icon=folium.Icon(icon="cloud",color="green")
    ).add_to(m_filtered)

# Save the filtered map as an HTML file
m_filtered.save("filtered_colorado_product_manufacturers_map_denver.html")

# Display the filtered map in the notebook
m_filtered

In [7]:
# Example: Search for product manufacturers in a specific city
city_search = "Colorado Springs"  # Replace with user input

# Filter the DataFrame based on the city
filtered_df = df[df['City'].str.contains(city_search, case=False, na=False)]

# Create a map for the filtered results
m_filtered = folium.Map(location=[38.8591, -104.8135], zoom_start=7)

for idx, row in filtered_df.iterrows():
    popup_text = f"""
    <strong>{row['Facility Name']}</strong><br>
    <strong>{row['DBA']}</strong><br>
    Facility Type: {row['Facility Type']}<br>
    {row['Street']}<br>
    {row['City']}, {row['State']} {row['Zip Code']}
    """
    folium.Marker(
        location=[row['Latitude'], row['Longitude']],
        popup=popup_text, icon=folium.Icon(icon="cloud",color="green")
    ).add_to(m_filtered)

# Save the filtered map as an HTML file
m_filtered.save("filtered_colorado_product_manufacturers_map_colorado_springs.html")

# Display the filtered map in the notebook
m_filtered

In [8]:
# Example: Search for product manufacturers in a specific city
city_search = "Aurora"  # Replace with user input

# Filter the DataFrame based on the city
filtered_df = df[df['City'].str.contains(city_search, case=False, na=False)]

# Create a map for the filtered results
m_filtered = folium.Map(location=[39.7108, -104.8125], zoom_start=7)

for idx, row in filtered_df.iterrows():
    popup_text = f"""
    <strong>{row['Facility Name']}</strong><br>
    <strong>{row['DBA']}</strong><br>
    Facility Type: {row['Facility Type']}<br>
    {row['Street']}<br>
    {row['City']}, {row['State']} {row['Zip Code']}
    """
    folium.Marker(
        location=[row['Latitude'], row['Longitude']],
        popup=popup_text, icon=folium.Icon(icon="cloud",color="green")
    ).add_to(m_filtered)

# Save the filtered map as an HTML file
m_filtered.save("filtered_colorado_product_manufacturers_map_aurora.html")

# Display the filtered map in the notebook
m_filtered

In [9]:
# Example: Search for product manufacturers in a specific city
city_search = "Fort Collins"  # Replace with user input

# Filter the DataFrame based on the city
filtered_df = df[df['City'].str.contains(city_search, case=False, na=False)]

# Create a map for the filtered results
m_filtered = folium.Map(location=[40.5853, -105.0844], zoom_start=7)

for idx, row in filtered_df.iterrows():
    popup_text = f"""
    <strong>{row['Facility Name']}</strong><br>
    <strong>{row['DBA']}</strong><br>
    Facility Type: {row['Facility Type']}<br>
    {row['Street']}<br>
    {row['City']}, {row['State']} {row['Zip Code']}
    """
    folium.Marker(
        location=[row['Latitude'], row['Longitude']],
        popup=popup_text, icon=folium.Icon(icon="cloud",color="green")
    ).add_to(m_filtered)

# Save the filtered map as an HTML file
m_filtered.save("filtered_colorado_product_manufacturers_map_fort_collins.html")

# Display the filtered map in the notebook
m_filtered

In [12]:
# Example: Search for product manufacturers in a specific city
city_search = "Garden City"  # Replace with user input

# Filter the DataFrame based on the city
filtered_df = df[df['City'].str.contains(city_search, case=False, na=False)]

# Create a map for the filtered results
m_filtered = folium.Map(location=[40.4233, -104.7112], zoom_start=7)

for idx, row in filtered_df.iterrows():
    popup_text = f"""
    <strong>{row['Facility Name']}</strong><br>
    <strong>{row['DBA']}</strong><br>
    Facility Type: {row['Facility Type']}<br>
    {row['Street']}<br>
    {row['City']}, {row['State']} {row['Zip Code']}
    """
    folium.Marker(
        location=[row['Latitude'], row['Longitude']],
        popup=popup_text, icon=folium.Icon(icon="cloud",color="green")
    ).add_to(m_filtered)

# Save the filtered map as an HTML file
m_filtered.save("filtered_colorado_product_manufacturers_map_garden_city.html")

# Display the filtered map in the notebook
m_filtered

In [13]:
# Example: Search for product manufacturers in a specific city
city_search = "Pueblo"  # Replace with user input

# Filter the DataFrame based on the city
filtered_df = df[df['City'].str.contains(city_search, case=False, na=False)]

# Create a map for the filtered results
m_filtered = folium.Map(location=[38.2765, -104.6046], zoom_start=7)

for idx, row in filtered_df.iterrows():
    popup_text = f"""
    <strong>{row['Facility Name']}</strong><br>
    <strong>{row['DBA']}</strong><br>
    Facility Type: {row['Facility Type']}<br>
    {row['Street']}<br>
    {row['City']}, {row['State']} {row['Zip Code']}
    """
    folium.Marker(
        location=[row['Latitude'], row['Longitude']],
        popup=popup_text, icon=folium.Icon(icon="cloud",color="green")
    ).add_to(m_filtered)

# Save the filtered map as an HTML file
m_filtered.save("filtered_colorado_product_manufacturers_map_pueblo.html")

# Display the filtered map in the notebook
m_filtered

In [14]:
# Example: Search for product manufacturers in a specific city
city_search = "Boulder"  # Replace with user input

# Filter the DataFrame based on the city
filtered_df = df[df['City'].str.contains(city_search, case=False, na=False)]

# Create a map for the filtered results
m_filtered = folium.Map(location=[40.0150, -105.2705], zoom_start=7)

for idx, row in filtered_df.iterrows():
    popup_text = f"""
    <strong>{row['Facility Name']}</strong><br>
    <strong>{row['DBA']}</strong><br>
    Facility Type: {row['Facility Type']}<br>
    {row['Street']}<br>
    {row['City']}, {row['State']} {row['Zip Code']}
    """
    folium.Marker(
        location=[row['Latitude'], row['Longitude']],
        popup=popup_text, icon=folium.Icon(icon="cloud",color="green")
    ).add_to(m_filtered)

# Save the filtered map as an HTML file
m_filtered.save("filtered_colorado_product_manufacturers_map_boulder.html")

# Display the filtered map in the notebook
m_filtered

## Step 5: Export Cleaned Data to CSV 

In [16]:
# Export the cleaned DataFrame to a CSV file
df.to_csv("cleaned_colorado_product_manufacturers_full_list_v2.csv", index=False)

# Confirm the export
print("Data exported to colorado_product_manufacturers_full_list_v2.csv")

Data exported to colorado_product_manufacturers_full_list_v2.csv
