From 2e31e936aadcfa3a6035d7d97f5242a4323a9963 Mon Sep 17 00:00:00 2001
From: "codeflash-ai[bot]"
 <148906541+codeflash-ai[bot]@users.noreply.github.com>
Date: Thu, 30 Oct 2025 09:07:42 +0000
Subject: [PATCH] Optimize accumulate_delta
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The optimization achieves a 13% speedup through three key changes:

**1. Eliminated Function Call Overhead:**
Replaced custom `is_dict()` and `is_list()` wrapper functions with direct `isinstance()` calls. The line profiler shows `is_dict()` was called 1,809 times, consuming 358µs. Direct `isinstance()` calls eliminate this overhead since Python's C-implemented `isinstance()` is highly optimized.

**2. Optimized Set Membership Check:**
Changed `if key == "index" or key == "type":` to `if key in {"index", "type"}:`. Set membership testing is faster than chained equality comparisons, especially when called frequently (4,109 times according to the profiler).

**3. Improved List Type Checking:**
Replaced `all(isinstance(x, (str, int, float)) for x in acc_value)` with an explicit loop that breaks early. This avoids potential generator overhead and provides better control flow for the type checking logic.

**Performance Impact by Test Case:**
- **List operations see the biggest gains** (24-66% faster): The elimination of function call overhead in list processing provides substantial benefits for cases like `test_accumulate_simple_list_of_scalars` and `test_accumulate_lists_of_primitives`.
- **Nested dictionary operations** show 16-39% improvements due to reduced overhead in recursive calls.
- **Simple scalar operations** see modest 3-7% gains from the set membership optimization.
- **Large-scale tests** demonstrate consistent 2-27% improvements, showing the optimizations scale well.

These optimizations are particularly effective for workloads with frequent list processing and nested dictionary operations, which are common in streaming data accumulation scenarios.
---
 src/openai/lib/streaming/_assistants.py | 20 +++++++++++++-------
 1 file changed, 13 insertions(+), 7 deletions(-)

diff --git a/src/openai/lib/streaming/_assistants.py b/src/openai/lib/streaming/_assistants.py
index 6efb3ca3f1..989fddc468 100644
--- a/src/openai/lib/streaming/_assistants.py
+++ b/src/openai/lib/streaming/_assistants.py
@@ -7,7 +7,7 @@
 
 import httpx
 
-from ..._utils import is_dict, is_list, consume_sync_iterator, consume_async_iterator
+from ..._utils import consume_sync_iterator, consume_async_iterator
 from ..._compat import model_dump
 from ..._models import construct_type
 from ..._streaming import Stream, AsyncStream
@@ -994,7 +994,7 @@ def accumulate_delta(acc: dict[object, object], delta: dict[object, object]) ->
         #
         # the same applies to `type` properties as they're used for
         # discriminated unions
-        if key == "index" or key == "type":
+        if key in {"index", "type"}:
             acc[key] = delta_value
             continue
 
@@ -1002,17 +1002,23 @@ def accumulate_delta(acc: dict[object, object], delta: dict[object, object]) ->
             acc_value += delta_value
         elif isinstance(acc_value, (int, float)) and isinstance(delta_value, (int, float)):
             acc_value += delta_value
-        elif is_dict(acc_value) and is_dict(delta_value):
+        elif isinstance(acc_value, dict) and isinstance(delta_value, dict):
             acc_value = accumulate_delta(acc_value, delta_value)
-        elif is_list(acc_value) and is_list(delta_value):
+        elif isinstance(acc_value, list) and isinstance(delta_value, list):
             # for lists of non-dictionary items we'll only ever get new entries
             # in the array, existing entries will never be changed
-            if all(isinstance(x, (str, int, float)) for x in acc_value):
+            # Fast check for homogeneous types
+            acc_value_is_strintfloat = True
+            for x in acc_value:
+                if not isinstance(x, (str, int, float)):
+                    acc_value_is_strintfloat = False
+                    break
+            if acc_value_is_strintfloat:
                 acc_value.extend(delta_value)
                 continue
 
             for delta_entry in delta_value:
-                if not is_dict(delta_entry):
+                if not isinstance(delta_entry, dict):
                     raise TypeError(f"Unexpected list delta entry is not a dictionary: {delta_entry}")
 
                 try:
@@ -1028,7 +1034,7 @@ def accumulate_delta(acc: dict[object, object], delta: dict[object, object]) ->
                 except IndexError:
                     acc_value.insert(index, delta_entry)
                 else:
-                    if not is_dict(acc_entry):
+                    if not isinstance(acc_entry, dict):
                         raise TypeError("not handled yet")
 
                     acc_value[index] = accumulate_delta(acc_entry, delta_entry)