In [1]:
from ethpandaops_python.hypersync import Hypersync
from ethpandaops_python.preprocessor import Preprocessor
from holoviews import opts
import nest_asyncio
import polars as pl
import panel as pn


# Patch asyncio so an event loop can be re-entered from inside the notebook's
# already-running loop; applied before any client objects are created.
nest_asyncio.apply()
# Load Panel with the plotly extension, the "material" template, and
# components stretched to the available width.
pn.extension("plotly", template="material", sizing_mode="stretch_width")
# Polars display settings: string cells up to 200 characters, floats printed
# in "full" format.
pl.Config.set_fmt_str_lengths(200)
# The last call returns the Config class, which the notebook echoes as the cell output.
pl.Config.set_fmt_float("full")

polars.config.Config

### Data Query

In [2]:
# Blob producer addresses. Only `base` is used in this cell; `arbitrum` is
# defined but not referenced here.
arbitrum: str = "0xC1b634853Cb333D3aD8663715b08f41A3Aec47cc"
base: str = "0x5050F69a9786F081509234F1a7F4684b5E5b76C9"

# Look-back window, shared by the preprocessor and the Hypersync query.
num_days: int = 5

# Preprocessor for the selected blob producer over the look-back window.
preprocessor: Preprocessor = Preprocessor(
    network="mainnet",
    blob_producer=base,
    period=num_days,
)

# Transactions of the same address over the same window; the address is
# passed lower-cased to the Hypersync client.
client = Hypersync()
txs_df = client.query_txs(period=num_days, address=base.lower())

In [3]:
# Fetch the slot-inclusion frame from the preprocessor configured in the data-query cell.
slot_inclusion_df: pl.DataFrame = preprocessor.slot_inclusion()

In [4]:
# Clean the slot-inclusion frame:
#   1. drop rows containing nulls,
#   2. drop columns that are not used further down,
#   3. discard outliers: rows with an unusually high slot count (suspected to
#      be an error in the xatu mempool data) via the two thresholds below.
# NOTE(review): the original note also mentions discarding a single tx with 5
# blobs and one with 7; no blob-count filter is visible here, so presumably
# those rows are caught by the thresholds -- confirm.
processed_slot_inclusion_df = (
    slot_inclusion_df.drop_nulls()
    .drop(
        [
            "meta_network_name",
            "block_root",
            "blob_size",
            "from",
            "to",
            "blob_hashes_length",
            "blob_sidecars_size",
        ]
    )
    .filter(
        (pl.col("slot inclusion rate") < 250)
        & (pl.col("slot inclusion rate (50 blob average)") < 40)
    )
)

In [5]:
# Attach the Hypersync transaction data to each slot-inclusion row, matching
# on the transaction hash. A left join keeps rows without a matching
# transaction (their transaction columns are null).
joined_processed_slot_inclusion_df = processed_slot_inclusion_df.join(
    other=txs_df,
    how="left",
    on="hash",
)

In [6]:
# Add a `<column>_gwei` companion (value / 10**9, rounded to 3 decimals) for
# each fee column:
#   effective_gas_price      -> gas price that was paid, including priority fee
#   max_fee_per_gas          -> max gas price the rollup is willing to pay
#   max_priority_fee_per_gas -> priority gas fee
# Rows with any null are then dropped and the result is ordered by
# submission_count, highest first.
slot_inclusion_tx_df = (
    joined_processed_slot_inclusion_df.with_columns(
        [
            (pl.col(fee_column) / 10**9).round(3).alias(f"{fee_column}_gwei")
            for fee_column in (
                "effective_gas_price",
                "max_fee_per_gas",
                "max_priority_fee_per_gas",
            )
        ]
    )
    .drop_nulls()
    .sort(by="submission_count", descending=True)
)

In [7]:
# Preview the first five rows of the joined, gwei-converted frame.
slot_inclusion_tx_df.head(5)

versioned_hash,nonce,event_date_time_min,event_date_time_max,fill_percentage,blob_gas,blob_gas_fee_cap,gas_price,gas_tip_cap,gas_fee_cap,hash,submission_count,slot,slot time,kzg_commitment,blob_empty_size,beacon_inclusion_time,slot inclusion rate,slot inclusion rate (50 blob average),slot target inclusion rate (2 slots),block_number,from_,to,gas,transaction_index,gas_price_right,effective_gas_price,gas_used,cumulative_gas_used,max_fee_per_gas,max_priority_fee_per_gas,effective_gas_price_gwei,max_fee_per_gas_gwei,max_priority_fee_per_gas_gwei
str,u64,datetime[ms],datetime[ms],f64,f64,f64,f64,f64,f64,str,u32,u32,datetime[ms],str,u32,f64,f64,f64,i32,i64,str,str,f64,i64,f64,f64,f64,f64,f64,f64,f64,f64,f64
"""0x0191095f5a3af3d9685cc9f45be3e1dd8ea8b89caca83b164172e337b6fb7824""",383167,2024-04-06 19:44:56.432,2024-04-06 19:44:57.288,97.34999999999998,786432,1000000000,30581383300,2000000000,30581383300,"""0xab2b775aa9c647223962e08e5017bfe98e74c7ca70d45af92548a13dec07087f""",1,8800724,2024-04-06 19:45:11,"""0xb5f0d52f8d6e4a2100e3347238407d611950997b827e4475a546f3de8050833741a5829f4750dbd41b1681f4ecb28778""",0,14.568,2,1.76,2,19598847,"""0x5050f69a9786f081509234f1a7f4684b5e5b76c9""","""0xff00000000000000000000000000000000008453""",21000,111,14544557645,14544557645,21000,8084200,30581383300,2000000000,14.545,30.581,2
"""0x01af2c1e4b015c8f881da4c34fa738b5b6c0280d2a7295a839fa767eb73adc16""",383167,2024-04-06 19:44:56.432,2024-04-06 19:44:57.288,97.34999999999998,786432,1000000000,30581383300,2000000000,30581383300,"""0xab2b775aa9c647223962e08e5017bfe98e74c7ca70d45af92548a13dec07087f""",1,8800724,2024-04-06 19:45:11,"""0x83c9022464f6f251345f667d5165dad9ee55e1e4e003b74ed84649c43e184d190fdb7497c251a197b37e7c09ea9d0b70""",0,14.568,2,1.76,2,19598847,"""0x5050f69a9786f081509234f1a7f4684b5e5b76c9""","""0xff00000000000000000000000000000000008453""",21000,111,14544557645,14544557645,21000,8084200,30581383300,2000000000,14.545,30.581,2
"""0x019cdb3ff2cbed01b05144f518a3b157d3fdf97b1e7257ce0164fc004932853e""",383167,2024-04-06 19:44:56.432,2024-04-06 19:44:57.288,97.34999999999998,786432,1000000000,30581383300,2000000000,30581383300,"""0xab2b775aa9c647223962e08e5017bfe98e74c7ca70d45af92548a13dec07087f""",1,8800724,2024-04-06 19:45:11,"""0xab01cbffecea0b006e6898d21f949b71acdeb860d9a5c8449ffc602dd6a731dfe57e994c564f0fb854a156674bfc1760""",20805,14.568,2,1.76,2,19598847,"""0x5050f69a9786f081509234f1a7f4684b5e5b76c9""","""0xff00000000000000000000000000000000008453""",21000,111,14544557645,14544557645,21000,8084200,30581383300,2000000000,14.545,30.581,2
"""0x013bc43d7887e47bc144c06a4c58d230c4cbc740b36a03ac446d4d3c03dc6dc5""",383167,2024-04-06 19:44:56.432,2024-04-06 19:44:57.288,97.34999999999998,786432,1000000000,30581383300,2000000000,30581383300,"""0xab2b775aa9c647223962e08e5017bfe98e74c7ca70d45af92548a13dec07087f""",1,8800724,2024-04-06 19:45:11,"""0x930262ebbbeb6ffb534087cd6a1f62fb46540e0d28aa8c5385a6b8faf9fc4c643b2348956b9816f19ffabff1c578a124""",0,14.568,2,1.76,2,19598847,"""0x5050f69a9786f081509234f1a7f4684b5e5b76c9""","""0xff00000000000000000000000000000000008453""",21000,111,14544557645,14544557645,21000,8084200,30581383300,2000000000,14.545,30.581,2
"""0x0178a8c8a98e5ad8982f8f3da002ff7dd9e1f3b04c7d2b233699758eb7ec6ddc""",383167,2024-04-06 19:44:56.432,2024-04-06 19:44:57.288,97.34999999999998,786432,1000000000,30581383300,2000000000,30581383300,"""0xab2b775aa9c647223962e08e5017bfe98e74c7ca70d45af92548a13dec07087f""",1,8800724,2024-04-06 19:45:11,"""0x86c626a89d47b8b60b7367672588988f9350ea8ee89da9abbdd7b38f302e6f60ec4cf08d6f7135575dc3bf157e4848c4""",0,14.568,2,1.76,2,19598847,"""0x5050f69a9786f081509234f1a7f4684b5e5b76c9""","""0xff00000000000000000000000000000000008453""",21000,111,14544557645,14544557645,21000,8084200,30581383300,2000000000,14.545,30.581,2


### Stats at a Glance

In [8]:
# Sanity check: (rows, columns) of the slot-inclusion-rate column, i.e. how many rows are analysed.
slot_inclusion_tx_df.select("slot inclusion rate").shape

(20812, 1)

In [9]:
# One-row summary: number of distinct (hash, slot inclusion rate) pairs that
# fall into each inclusion-speed bucket (1 slot, 2 slots, 3 or more slots).
#
# The comparisons already yield booleans, so they are summed directly instead
# of going through when/then/otherwise, and the counts are aggregated with
# `select` rather than broadcast over every row and sliced back to row 0.
# An empty input therefore produces a single row of zero counts.
slot_chance_bar_df = (
    slot_inclusion_tx_df.select("hash", "slot inclusion rate")
    .unique()  # count each transaction once, not once per blob row
    .select(
        (pl.col("slot inclusion rate") == 1).sum().alias("1 slot"),
        (pl.col("slot inclusion rate") == 2).sum().alias("2 slots"),
        (pl.col("slot inclusion rate") >= 3).sum().alias("3+ slots"),
    )
)

In [18]:
# Horizontal stacked bar of the three bucket counts from the one-row summary frame.
slot_chance_bar_chart = slot_chance_bar_df.plot.barh(
    title="Slot Inclusion Breakdown",
    ylabel="number of txs",
    stacked=True,
    height=400,
    width=1000,
)

In [19]:
# Render the bar chart inline as the cell output.
slot_chance_bar_chart

### Slot Inclusion Time Charts

In [71]:
# Line chart over slot time with three series: the raw slot inclusion rate
# (blue), its 50-blob average (red) and the 2-slot target (black).
slot_inclusion_line_chart = (
    slot_inclusion_tx_df.drop_nulls()
    .select(
        [
            "slot time",
            "slot inclusion rate",
            "slot inclusion rate (50 blob average)",
            "slot target inclusion rate (2 slots)",
            "submission_count",
        ]
    )
    .plot.line(
        x="slot time",
        y=[
            "slot inclusion rate",
            "slot inclusion rate (50 blob average)",
            "slot target inclusion rate (2 slots)",
        ],
        color=["blue", "red", "black"],
        title="Historical Slot Inclusion",
        xlabel="Slot Date Time",
        ylabel="Beacon Block Inclusion (block)",
        shared_axes=True,
        height=400,
        width=1000,
    )
)

### Priority Fee Effectiveness for Faster Slot Inclusion

In [72]:
# Priority fee bid expressed as a percentage of the effective gas price
# (both in gwei), rounded to 3 decimals.
priority_fee_premium_df = slot_inclusion_tx_df.with_columns(
    pl.col("max_priority_fee_per_gas_gwei")
    .truediv(pl.col("effective_gas_price_gwei"))
    .mul(100)
    .round(3)
    .alias("priority_fee_bid_percent_premium")
)

In [74]:
# Scatter plot of the mean priority-fee bid premium for each slot inclusion
# rate.
#
# Rows are de-duplicated on the six selected columns before averaging so a
# transaction carrying several blobs is not counted once per blob.
# The min-block-gas / gas-fluctuation columns that used to be derived here
# were never plotted (only x and y below are used), so that dead computation
# has been removed.
priority_fee_premium_chart = (
    priority_fee_premium_df.select(
        "block_number",
        "max_priority_fee_per_gas_gwei",
        "effective_gas_price_gwei",
        "priority_fee_bid_percent_premium",
        "slot inclusion rate",
        "submission_count",
    )
    .unique()
    .group_by("slot inclusion rate")
    .agg(pl.col("priority_fee_bid_percent_premium").mean())
    .sort(by="slot inclusion rate")
    .plot.scatter(
        x="slot inclusion rate",
        y="priority_fee_bid_percent_premium",
        ylabel="priority fee bid premium %",
        title="mean priority fee bid premium per slot inclusion rate",
        width=1000,
        height=400,
    )
)

In [75]:
# Reduce the premium frame to distinct rows over the six columns below,
# order them by block number, and derive:
#   min_block_gas_gwei      -> estimate of the minimum block gas price: gwei paid minus the priority fee
#   gas_fluctuation_gwei    -> absolute change of that estimate versus the previous row
#   gas_fluctuation_percent -> that change relative to the row's own estimate, in percent
# NOTE: this rebinds `priority_fee_premium_df`. Re-running the cell still
# works because the six selected columns are kept in the result.
priority_fee_premium_df = (
    priority_fee_premium_df.select(
        [
            "block_number",
            "max_priority_fee_per_gas_gwei",
            "effective_gas_price_gwei",
            "priority_fee_bid_percent_premium",
            "slot inclusion rate",
            "submission_count",
        ]
    )
    .unique()
    .sort(by="block_number")
    .with_columns(
        pl.col("effective_gas_price_gwei")
        .sub(pl.col("max_priority_fee_per_gas_gwei"))
        .alias("min_block_gas_gwei")
    )
    .with_columns(
        pl.col("min_block_gas_gwei").diff().abs().alias("gas_fluctuation_gwei")
    )
    .with_columns(
        pl.col("gas_fluctuation_gwei")
        .truediv(pl.col("min_block_gas_gwei"))
        .mul(100)
        .alias("gas_fluctuation_percent")
    )
)

In [140]:
# Violin plot: distribution of the priority-fee bid premium, one violin per
# slot inclusion rate.
volin_chart = priority_fee_premium_df.sort(by="slot inclusion rate").plot.violin(
    y="priority_fee_bid_percent_premium",
    by="slot inclusion rate",
    c="slot inclusion rate",
    height=400,
    width=1000,
)

# Trend lines per slot inclusion rate: median bid premium (green) and mean
# effective gas price (red). The aggregates are given their display names
# directly instead of being renamed afterwards.
line_chart_bid_premium = (
    priority_fee_premium_df.group_by("slot inclusion rate")
    .agg(
        pl.col("priority_fee_bid_percent_premium")
        .median()
        .alias("priority fee bid premium (%)"),
        pl.col("effective_gas_price_gwei").mean().alias("block gas price (gwei)"),
    )
    .sort(by="slot inclusion rate")
    .plot.line(
        x="slot inclusion rate",
        y=["priority fee bid premium (%)", "block gas price (gwei)"],
        color=["g", "r"],
        title="gas bid premium probability distributions",
        ylabel="bid premium (%, gwei)",
    )
)

In [141]:
# Combine the violin plot and the two trend lines into a single chart with the `*` operator.
violin_line_gas_chart = volin_chart * line_chart_bid_premium

### Assemble Dashboard

In [148]:
# Dashboard layout: an introductory Markdown pane followed by a column that
# alternates explanatory Markdown with the charts built in the cells above
# (bar chart, line chart, scatter plot, violin + trend-line overlay).
dash = pn.Column(
    pn.pane.Markdown(
        """
        # EIP-4844 Slot Inclusion Dashboard

        ## About
        This dashboard shows detailed analytics for blobs and how fast they are included into the next slot as well as the efficiency of using EIP-1559 priority fees
        as a bidding mechanism for faster slot inclusion. As of April 11, 2024, the data is currently restricted to Base posting data over a 5 day period with
        plans to open up to other rollups soon. This dashboard is made using [Xatu Data](https://github.com/ethpandaops/xatu-data?tab=readme-ov-file) for EL mempool and Beacon chain data and [Hypersync](https://github.com/enviodev/hypersync-client-python)
        for transaction gas data for the [EIP-4844 data challenge](https://esp.ethereum.foundation/data-challenge-4844).

        ## Summary of Results
        - Blobs have a highly variable slot inclusion rate, with a nontrivial amount of blobs taking 3+ slots to be included.
        - Higher EIP-1559 priority fees correlate with longer slot inclusion rates.
        - Uncertainty around block gas and priority fee bidding premiums increases with longer slot inclusion rates.

        ## Slot Inclusion Methodology
        When a transaction is resubmitted with updated gas parameters, the transaction hash changes. For example take this blob reference hash - 0x01c738cf37c911334c771f2295c060e5bd7d084f347e4334863336724934c59a.
        On [etherscan](https://etherscan.io/tx/0x763d823c0f933c4d2eb84406b37aa2649753f2f563fa3ee6d27251c6a52a8d69) we can see that the transaction was replaced by the user. We can see on Ethernow that the transaction contains
        the same blob reference hash in both the [original tx](https://www.ethernow.xyz/tx/0x763d823c0f933c4d2eb84406b37aa2649753f2f563fa3ee6d27251c6a52a8d69?batchIndex=1) and the [resubmitted tx](https://www.ethernow.xyz/tx/0x5a4094662bd05ff3639a8979927ab527e007a6925387951a9c1b3d2958b13a86?batchIndex=1).

        We can measure the total time that a blob hash sat in the mempool by subtracting the time the original tx was first seen from the slot time at which it is eventually finalized on the beacon chain.
        In this particular example, the total time that the blob sat in the mempool was not from 18:56:27 to 18:57:11 (4 slots), but really 18:54:29 to 18:57:11 (14 slots).
        """
    ),
    pn.Column(
        pn.pane.Markdown(
            """
            ## Slot Inclusion Breakdown
            This bar chart represents the number of transactions that are being included within 1 slot, 2 slots, and 3+ slots.
            * 1 slot = fastest possible inclusion time
            * 2 slots = good inclusion time
            * 3+ slots = slow inclusion time
            """
        ),
        slot_chance_bar_chart.opts(axiswise=True),
        pn.pane.Markdown(
            """
        ## Slot Inclusion Rates
        This time-series chart shows the slot inclusion performance over time from when it's first seen in the mempool to when it gets finalized in the beacon block.
        A 50 blob slot inclusion average is taken to smooth out the performance. The target slot inclusion rate is 2. To the right is the overall distribution of the slot inclusion rate.
        While a lot of blobs get finalized on the beacon chain within 1-2 blocks, there is still a non-trivial number of outliers that can take upwards of 5-10 blocks before finalizing.
        """
        ),
        # NOTE(review): the text above refers to a distribution chart "to the
        # right", but this row only contains the line chart -- either add the
        # distribution chart or drop that sentence.
        pn.Row(slot_inclusion_line_chart.opts(axiswise=True)),
        pn.pane.Markdown(
            """
        ## EIP-1559 Priority Fee Premium Correlation with Slot Rates
        The scatterplot shows the priority fee bid premium. There isn't a strong correlation between higher priority fee bid premiums and shorter slot inclusion rates. On the contrary,
        the longer it takes for the blob to be included, the higher the priority fee bid premium tends to be.
        """
        ),
        pn.Row(priority_fee_premium_chart),
        pn.pane.Markdown(
            """
        ## Slot Inclusion Bidding Unpredictability
        The major takeaway is that uncertainty around both block gas and priority fee bidding tends to increase the longer it takes for a blob to be included in a slot. There are three major
        characteristics in the chart - one violin plot for the probability distribution and two trend lines for priority fee bids and block gas prices.
        * violin plots for each slot inclusion rate, showing the probability distribution of the priority gas bidding premium for each inclusion slot.
        The higher the slot inclusion rate, the more uncertainty there is around the bid premium.
        * the green line shows the median trend line for the priority fee bid premium (in %), which tends to drift higher as slot inclusion rate gets higher.
        * the red line shows the mean trend line for the block gas price (in gwei), which drifts upwards as the slot inclusion rate gets higher.
        """
        ),
        pn.Row(violin_line_gas_chart),
    ),
)

In [149]:
# Mark the dashboard as servable (e.g. for use with `panel serve`).
# For an ad-hoc local preview, call dash.show() instead.
dash.servable()

BokehModel(combine_events=True, render_bundle={'docs_json': {'00c82a29-b5c0-4e0e-ae61-e07768253a6a': {'version…