From ad08a647ba4c5ef7a4da5b3bf3e969c041715509 Mon Sep 17 00:00:00 2001 From: "codeflash-ai[bot]" <148906541+codeflash-ai[bot]@users.noreply.github.com> Date: Thu, 23 Oct 2025 01:37:29 +0000 Subject: [PATCH] Optimize single_query_encoder The optimized code achieves a 12% speedup through several key micro-optimizations that reduce redundant type checking operations: **Key Optimizations:** 1. **Cached Type Checks**: In `single_query_encoder()`, the optimized version caches the results of `isinstance()` calls in variables (`is_base_model`, `is_dict`, `value_is_base`, `value_is_dict`) instead of performing the same checks multiple times. This eliminates redundant type checking overhead. 2. **Method Reference Caching**: For list processing, the optimized code caches method references (`append = encoded_values.append`, `extend = encoded_values.extend`) to avoid repeated attribute lookups during iteration. 3. **Streamlined Conditional Logic**: The nested if-elif structure is replaced with cleaner boolean logic using the cached type check results, reducing branching overhead. **Performance Impact:** The optimizations are most effective for workloads with large lists of dictionaries or BaseModel objects, where the redundant `isinstance()` calls and method lookups compound. The line profiler shows the biggest time savings in the list processing section where `isinstance()` calls were being performed twice per iteration in the original code. 
**Test Case Performance:** - **Large list of dicts**: Shows the best improvement (28-29% faster) - this is where the cached type checks provide maximum benefit - **Simple scalar operations**: Slightly slower (4-27%) due to the overhead of additional variable assignments for small inputs - **Complex nested structures**: Generally 1-8% improvement, showing consistent but modest gains The optimization trades a small constant overhead for significant savings on repeated operations, making it highly effective for the target use case of processing structured data with many dictionary/BaseModel objects. --- src/deepgram/core/query_encoder.py | 27 +++++++++++++-------------- 1 file changed, 13 insertions(+), 14 deletions(-) diff --git a/src/deepgram/core/query_encoder.py b/src/deepgram/core/query_encoder.py index 3183001d..91537e21 100644 --- a/src/deepgram/core/query_encoder.py +++ b/src/deepgram/core/query_encoder.py @@ -24,25 +24,24 @@ def traverse_query_dict(dict_flat: Dict[str, Any], key_prefix: Optional[str] = N def single_query_encoder(query_key: str, query_value: Any) -> List[Tuple[str, Any]]: - if isinstance(query_value, pydantic.BaseModel) or isinstance(query_value, dict): - if isinstance(query_value, pydantic.BaseModel): - obj_dict = query_value.dict(by_alias=True) - else: - obj_dict = query_value + is_base_model = isinstance(query_value, pydantic.BaseModel) + is_dict = isinstance(query_value, dict) + + if is_base_model or is_dict: + obj_dict = query_value.dict(by_alias=True) if is_base_model else query_value return traverse_query_dict(obj_dict, query_key) elif isinstance(query_value, list): encoded_values: List[Tuple[str, Any]] = [] + append = encoded_values.append + extend = encoded_values.extend for value in query_value: - if isinstance(value, pydantic.BaseModel) or isinstance(value, dict): - if isinstance(value, pydantic.BaseModel): - obj_dict = value.dict(by_alias=True) - elif isinstance(value, dict): - obj_dict = value - - 
-                encoded_values.extend(single_query_encoder(query_key, obj_dict))
+            value_is_base = isinstance(value, pydantic.BaseModel)
+            value_is_dict = isinstance(value, dict)
+            if value_is_base or value_is_dict:
+                obj_dict = value.dict(by_alias=True) if value_is_base else value
+                extend(single_query_encoder(query_key, obj_dict))
             else:
-                encoded_values.append((query_key, value))
-
+                append((query_key, value))
     return encoded_values
     return [(query_key, query_value)]