# Imagery Service Analysis

Analysis of OpenStreetMap changesets by the imagery services recorded in the imagery_used column. The imagery tag is set automatically by iD, Vespucci and Go Map!!. Because other editors do not set it, and iD is vastly more popular than the other editors that do, the graphs below are very close to a 'market share of iD by edit volume'. JOSM users typically use the source field instead to note the sources they actually used.

In [1]:
import duckdb
import util

# Project-local notebook setup from the `util` helper module. What it configures
# is not visible in this notebook — presumably plotting/rendering defaults used
# by util.show_figure / util.show_tables below; confirm in util.
util.init()

## Monthly Percentage of Edits and Contributors Using Imagery Services

In [2]:
# Per month: the share of contributors and of edits whose changesets carry an
# imagery tag, relative to all changesets of that month. Months without any
# imagery-tagged changeset are kept (LEFT JOIN) and reported as 0.
monthly_share_sql = """
WITH monthly_with_imagery AS (
    SELECT 
        year,
        month,
        CONCAT(year, '-', LPAD(CAST(month as VARCHAR), 2, '0')) as months,
        COUNT(DISTINCT user_name) as contributors_with_imagery,
        SUM(edit_count) as edits_with_imagery
    FROM '../changeset_data/year=*/month=*/*.parquet'
    WHERE imagery_used IS NOT NULL
    GROUP BY year, month
),
monthly_total AS (
    SELECT 
        year,
        month,
        CONCAT(year, '-', LPAD(CAST(month as VARCHAR), 2, '0')) as months,
        COUNT(DISTINCT user_name) as total_contributors,
        SUM(edit_count) as total_edits
    FROM '../changeset_data/year=*/month=*/*.parquet'
    GROUP BY year, month
)
SELECT 
    mt.months,
    COALESCE(ROUND((mwi.contributors_with_imagery * 100.0) / mt.total_contributors, 2), 0) as 'Percentage Contributors with Imagery',
    COALESCE(ROUND((mwi.edits_with_imagery * 100.0) / mt.total_edits, 2), 0) as 'Percentage Edits with Imagery'
FROM monthly_total mt
LEFT JOIN monthly_with_imagery mwi ON mt.year = mwi.year AND mt.month = mwi.month
ORDER BY mt.year, mt.month
"""
df = duckdb.sql(monthly_share_sql).df()

# The two figures differ only in the metric name, which appears in the title,
# the label and the result column, so they are generated from that one word.
share_figures = [
    util.FigureConfig(
        title=f"Monthly Percentage of {metric} Using Imagery Services",
        label=metric,
        x_col="months",
        y_col=f"Percentage {metric} with Imagery",
        y_unit_hover_template="%",
        query_or_df=df,
    )
    for metric in ("Contributors", "Edits")
]
util.show_figure(share_figures)

## Monthly Top 10 Imagery Services: Edits, Accumulated Edits, Contributors and Accumulated Contributors

In [3]:
# Monthly and accumulated edits/contributors for the 10 imagery services with
# the most edits overall.
#
# "Contributors Accumulated" counts every contributor exactly once per service,
# in the month they first used it. A running sum of the monthly distinct
# contributor counts would count a contributor who is active in k months k times.
df = duckdb.sql("""
WITH imagery_expanded AS (
    SELECT 
        year,
        month,
        -- zero-padded 'YYYY-MM', so string order equals chronological order
        CONCAT(year, '-', LPAD(CAST(month as VARCHAR), 2, '0')) as months,
        user_name,
        edit_count,
        unnest(imagery_used) as imagery_service
    FROM '../changeset_data/year=*/month=*/*.parquet'
    WHERE imagery_used IS NOT NULL
),
top_imagery AS (
    SELECT imagery_service
    FROM (
        SELECT
            imagery_service,
            SUM(edit_count) as total_edits
        FROM imagery_expanded
        GROUP BY imagery_service
        ORDER BY total_edits DESC
        LIMIT 10
    )
),
top_expanded AS (
    SELECT ie.*
    FROM imagery_expanded ie
    WHERE ie.imagery_service IN (SELECT imagery_service FROM top_imagery)
),
user_first_month AS (
    -- first month in which each contributor used each service
    SELECT
        user_name,
        imagery_service,
        MIN(months) as first_months
    FROM top_expanded
    GROUP BY user_name, imagery_service
),
monthly_imagery_data AS (
    SELECT 
        te.year,
        te.month,
        te.months,
        te.imagery_service,
        COUNT(DISTINCT te.user_name) as "Contributors",
        COUNT(DISTINCT CASE WHEN ufm.first_months = te.months THEN te.user_name END) as "New Contributors",
        SUM(te.edit_count) as "Edits"
    FROM top_expanded te
    -- LEFT JOIN so rows that find no match (e.g. NULL user_name) still count towards "Edits"
    LEFT JOIN user_first_month ufm
        ON te.user_name = ufm.user_name AND te.imagery_service = ufm.imagery_service
    GROUP BY te.year, te.month, te.months, te.imagery_service
)
SELECT 
    months,
    imagery_service,
    "Contributors",
    "Edits",
    SUM("New Contributors") OVER (PARTITION BY imagery_service ORDER BY year, month) as "Contributors Accumulated",
    SUM("Edits") OVER (PARTITION BY imagery_service ORDER BY year, month) as "Edits Accumulated"
FROM monthly_imagery_data
ORDER BY year, month, imagery_service
""").df()

# One line per imagery service (group_col) in each of the four figures.
util.show_figure(
    [
        util.FigureConfig(
            title="Monthly Edits by Top 10 Imagery Services",
            label="Edits",
            x_col="months",
            y_col="Edits",
            group_col="imagery_service",
            query_or_df=df,
        ),
        util.FigureConfig(
            title="Accumulated Edits by Top 10 Imagery Services",
            label="Edits Accumulated",
            x_col="months",
            y_col="Edits Accumulated",
            group_col="imagery_service",
            query_or_df=df,
        ),
        util.FigureConfig(
            title="Monthly Contributors by Top 10 Imagery Services",
            label="Contributors",
            x_col="months",
            y_col="Contributors",
            group_col="imagery_service",
            query_or_df=df,
        ),
        util.FigureConfig(
            title="Accumulated Contributors by Top 10 Imagery Services",
            label="Contributors Accumulated",
            x_col="months",
            y_col="Contributors Accumulated",
            group_col="imagery_service",
            query_or_df=df,
        ),
    ]
)

## Top 100 Imagery Services Yearly

In [4]:
import json

# Load replacement rules for clickable links: every rule that has a "link"
# entry turns the service name into an HTML anchor. The file is read as UTF-8
# explicitly, so non-ASCII service names do not depend on the locale's default
# encoding.
with open("../config/replace_rules_imagery_and_source.json", encoding="utf-8") as f:
    imagery_name_to_html_link = {
        name: f'<a href="{item["link"]}">{name}</a>' for name, item in json.load(f).items() if "link" in item
    }

# One row per (year, imagery service) with yearly edits/contributors, plus the
# service's all-time and 2021-onwards totals repeated on each of its rows.
# A contributor is "new" for a service in the first year they used it.
query = """
WITH imagery_expanded AS (
    SELECT 
        year,
        user_name,
        edit_count,
        unnest(imagery_used) as imagery_service
    FROM '../changeset_data/year=*/month=*/*.parquet'
    WHERE imagery_used IS NOT NULL
),
user_first_year AS (
    SELECT 
        user_name,
        imagery_service,
        MIN(year) as first_year
    FROM imagery_expanded
    GROUP BY user_name, imagery_service
),
imagery_totals AS (
    SELECT
        imagery_service as "Imagery Service",
        CAST(SUM(edit_count) as BIGINT) as total_edits_all_time,
        CAST(SUM(CASE WHEN year >= 2021 THEN edit_count ELSE 0 END) as BIGINT) as total_edits_2021_now,
        CAST(COUNT(DISTINCT user_name) as BIGINT) as total_contributors_all_time,
        CAST(COUNT(DISTINCT CASE WHEN year >= 2021 THEN user_name END) as BIGINT) as total_contributors_2021_now
    FROM imagery_expanded
    GROUP BY imagery_service
),
yearly_metrics AS (
    SELECT
        ie.year,
        ie.imagery_service as "Imagery Service",
        CAST(SUM(ie.edit_count) as BIGINT) as "Edits",
        CAST(COUNT(DISTINCT ie.user_name) as BIGINT) as "Contributors",
        CAST(COUNT(DISTINCT CASE WHEN ufy.first_year = ie.year THEN ie.user_name END) as BIGINT) as "New Contributors"
    FROM imagery_expanded ie
    LEFT JOIN user_first_year ufy 
        ON ie.user_name = ufy.user_name AND ie.imagery_service = ufy.imagery_service
    GROUP BY ie.year, ie.imagery_service
)
SELECT 
    ym.year,
    ym."Imagery Service",
    ym."Edits",
    ym."New Contributors",
    ym."Contributors",
    it.total_edits_all_time as "Total Edits",
    it.total_edits_2021_now as "Total Edits (2021 - Now)",
    it.total_contributors_all_time as "Total Contributors",
    it.total_contributors_2021_now as "Total Contributors (2021 - Now)"
FROM yearly_metrics ym
JOIN imagery_totals it
    ON ym."Imagery Service" = it."Imagery Service"
ORDER BY year DESC, "Edits" DESC
"""
df = duckdb.sql(query).df()

# Apply HTML links to imagery service names; names without a rule stay as-is.
df["Imagery Service"] = df["Imagery Service"].apply(lambda name: imagery_name_to_html_link.get(name, name))

# Each total is constant across a service's rows, so first() recovers it per
# service; nlargest(100) then picks the 100 services to show for that ranking.
top_100_contributors = df.groupby("Imagery Service")["Total Contributors"].first().nlargest(100)
top_100_contributors_2021_now = df.groupby("Imagery Service")["Total Contributors (2021 - Now)"].first().nlargest(100)
top_100_edits = df.groupby("Imagery Service")["Total Edits"].first().nlargest(100)
top_100_edits_2021_now = df.groupby("Imagery Service")["Total Edits (2021 - Now)"].first().nlargest(100)

# Four tables of years x services: contributors and edits, all-time and
# 2021 onwards. The "2021 - Now" tables also drop the rows of earlier years.
# sum_col presumably supplies the total column (and the ranking) of each
# table — confirm in util.TableConfig.
table_configs = [
    util.TableConfig(
        title="Top 100 Imagery Services by Contributors",
        query_or_df=df[df["Imagery Service"].isin(top_100_contributors.index)],
        x_axis_col="year",
        y_axis_col="Imagery Service",
        value_col="Contributors",
        center_columns=["Rank", "Imagery Service"],
        sum_col="Total Contributors",
    ),
    util.TableConfig(
        title="Top 100 Imagery Services by Contributors 2021 - Now",
        query_or_df=df[(df["Imagery Service"].isin(top_100_contributors_2021_now.index)) & (df["year"] >= 2021)],
        x_axis_col="year",
        y_axis_col="Imagery Service",
        value_col="Contributors",
        center_columns=["Rank", "Imagery Service"],
        sum_col="Total Contributors (2021 - Now)",
    ),
    util.TableConfig(
        title="Top 100 Imagery Services by Edits",
        query_or_df=df[df["Imagery Service"].isin(top_100_edits.index)],
        x_axis_col="year",
        y_axis_col="Imagery Service",
        value_col="Edits",
        center_columns=["Rank", "Imagery Service"],
        sum_col="Total Edits",
    ),
    util.TableConfig(
        title="Top 100 Imagery Services by Edits 2021 - Now",
        query_or_df=df[(df["Imagery Service"].isin(top_100_edits_2021_now.index)) & (df["year"] >= 2021)],
        x_axis_col="year",
        y_axis_col="Imagery Service",
        value_col="Edits",
        center_columns=["Rank", "Imagery Service"],
        sum_col="Total Edits (2021 - Now)",
    ),
]

util.show_tables(table_configs)

Rank,Imagery Service,2013,2014,2015,2016,2017,2018,2019,2020,2021,2022,2023,2024,2025,Total Contributors
1,Bing Aerial Imagery,55606,123437,130064,134295,166720,174812,155602,169325,151032,126243,148789,153769,118205,1297720
2,.gpx data file,835,4243,7927,28777,45339,50670,47816,76173,82985,52319,45790,11851,8798,367030
3,Maxar Imagery,0,0,0,0,0,0,17936,35634,53021,48224,30163,221,10,150593
4,Esri World Imagery,0,0,0,1,4439,14942,19510,25003,23783,21113,34686,34227,28701,141204
5,Custom,345,1807,4729,9193,19536,12985,14523,37108,30860,4339,2912,3622,2898,128037
6,OpenStreetMap (Standard),0,0,0,1444,10559,12257,12768,11741,13993,13432,14584,14558,12125,84190
7,Mapbox Satellite,0,4168,6217,9999,9165,7459,8491,10857,14309,11113,17925,11016,8716,82594
8,BDOrtho,0,0,0,0,0,9870,12262,14168,13363,12923,13228,13109,9070,60844
9,.geojson data file,0,0,0,0,9,87,165,572,334,320,9326,36367,19401,60710
10,DigitalGlobe Imagery (now Maxar),0,0,0,1,14193,19685,12718,14,3,3,0,0,0,38697

Rank,Imagery Service,2021,2022,2023,2024,2025,Total Contributors (2021 - Now)
1,Bing Aerial Imagery,151032,126243,148789,153769,118205,542714
2,.gpx data file,82985,52319,45790,11851,8798,167376
3,Maxar Imagery,53021,48224,30163,221,10,113911
4,Esri World Imagery,23783,21113,34686,34227,28701,103676
5,.geojson data file,334,320,9326,36367,19401,60046
6,OpenStreetMap (Standard),13993,13432,14584,14558,12125,51519
7,Mapbox Satellite,14309,11113,17925,11016,8716,46543
8,BDOrtho,13363,12923,13228,13109,9070,40886
9,Custom,30860,4339,2912,3622,2898,40643
10,Geoportal 2: Orthophotomap,3270,5698,5749,6105,5290,17033

Rank,Imagery Service,2013,2014,2015,2016,2017,2018,2019,2020,2021,2022,2023,2024,2025,Total Edits
1,Bing Aerial Imagery,33882695,102551137,127200383,154939534,203958508,183015615,177464191,239303884,243368655,205560780,254642782,274891627,198763263,2399543054
2,Esri World Imagery,0,0,0,8,8452318,41922790,69786424,113631814,106377435,82663849,122441623,148005806,128594402,821876469
3,.gpx data file,219453,2565207,5555288,39532319,70750740,67934692,65209260,121075954,151036878,88886447,63041063,16292555,11523927,703623783
4,Maxar Imagery,0,0,0,0,0,0,63924802,138610588,158825063,140911869,67907783,82436,898,570263439
5,Mapbox Satellite,0,3438803,6033692,14574532,13465198,20838123,28249746,34429282,31625489,25024742,32817512,20543649,15368703,246409471
6,Custom,231494,2719162,6473638,12789661,23112184,20144383,17379655,36613661,36271610,14597768,12948468,18489524,14956233,216727441
7,Mapillary,0,0,0,503212,1485555,2538209,15494180,56091552,47080275,10665691,7770636,5969811,5432229,153031350
8,DigitalGlobe Imagery (now Maxar),0,0,0,1539,25354277,57809845,39323760,22270,115,330,0,0,0,122512136
9,Japan GSI,0,0,40938,2466320,3347234,8117710,14025690,11690505,13763789,15521406,15615869,16760078,12212014,113561553
10,.geojson data file,0,0,0,0,2331,92987,331436,2270091,1064008,1601530,12544902,46627720,35805147,100340152

Rank,Imagery Service,2021,2022,2023,2024,2025,Total Edits (2021 - Now)
1,Bing Aerial Imagery,243368655,205560780,254642782,274891627,198763263,1177227107
2,Esri World Imagery,106377435,82663849,122441623,148005806,128594402,588083115
3,Maxar Imagery,158825063,140911869,67907783,82436,898,367728049
4,.gpx data file,151036878,88886447,63041063,16292555,11523927,330780870
5,Mapbox Satellite,31625489,25024742,32817512,20543649,15368703,125380095
6,.geojson data file,1064008,1601530,12544902,46627720,35805147,97643307
7,Custom,36271610,14597768,12948468,18489524,14956233,97263603
8,Geoportal 2: Orthophotomap,10916550,15540071,18561472,19505231,14001319,78524643
9,Mapillary,47080275,10665691,7770636,5969811,5432229,76918642
10,Japan GSI,13763789,15521406,15615869,16760078,12212014,73873156
