From c95d5b36f4a5ff19ffbf8341a2538ec0a720793e Mon Sep 17 00:00:00 2001
From: Avikalp Kumar Gupta <avikalpgupta@gmail.com>
Date: Fri, 6 Jun 2025 16:43:07 -0400
Subject: [PATCH 1/7] Implement exponential backoff retry logic for OpenAI API
 calls in CodeAnalysisAgent

- Added a decorator to handle rate limit errors with exponential backoff and jitter.
- Refactored agent analysis execution to use the new retry logic.
- Enhanced dependency matching for components to allow more flexible name comparisons.
- Added functionality to track dependents in component relationships.
---
 diffgraph/ai_analysis.py | 54 +++++++++++++++++++++++++++++++++++++---
 1 file changed, 50 insertions(+), 4 deletions(-)

diff --git a/diffgraph/ai_analysis.py b/diffgraph/ai_analysis.py
index 44bbb48..3d028d0 100644
--- a/diffgraph/ai_analysis.py
+++ b/diffgraph/ai_analysis.py
@@ -3,6 +3,9 @@
 import os
 from pydantic import BaseModel
 from .graph_manager import GraphManager, FileStatus, ChangeType, ComponentNode
+import time
+import random
+import openai
 
 class FileChange(BaseModel):
     """Model representing a file change."""
@@ -15,6 +18,28 @@ class DiffAnalysis(BaseModel):
     summary: str
     mermaid_diagram: str
 
+def exponential_backoff_retry(func):
+    """Decorator to implement exponential backoff retry logic."""
+    def wrapper(*args, **kwargs):
+        max_retries = 5
+        base_delay = 1  # Start with 1 second
+        max_delay = 60  # Maximum delay of 60 seconds
+
+        for attempt in range(max_retries):
+            try:
+                return func(*args, **kwargs)
+            except openai.RateLimitError as e:
+                if attempt == max_retries - 1:  # Last attempt
+                    raise  # Re-raise the exception if all retries failed
+
+                # Calculate delay with exponential backoff and jitter
+                delay = min(base_delay * (2 ** attempt) + random.uniform(0, 1), max_delay)
+                print(f"Rate limit hit. Retrying in {delay:.2f} seconds...")
+                time.sleep(delay)
+            except Exception as e:
+                raise  # Re-raise other exceptions immediately
+    return wrapper
+
 class CodeAnalysisAgent:
     """Agent for analyzing code changes using OpenAI's Agents SDK."""
 
@@ -66,6 +91,12 @@ def _determine_change_type(self, status: str) -> ChangeType:
         else:
             return ChangeType.MODIFIED
 
+    @exponential_backoff_retry
+    def _run_agent_analysis(self, prompt: str) -> str:
+        """Run the agent analysis with retry logic."""
+        result = Runner.run_sync(self.agent, prompt)
+        return result.final_output
+
     def analyze_changes(self, files_with_content: List[Dict[str, str]]) -> DiffAnalysis:
         """
         Analyze code changes using the OpenAI agent, processing files incrementally.
@@ -114,9 +145,8 @@ def analyze_changes(self, files_with_content: List[Dict[str, str]]) -> DiffAnaly
                     for comp in processed_components:
                         prompt += f"- {comp.name}: {comp.summary}\n"
 
-                # Run the agent
-                result = Runner.run_sync(self.agent, prompt)
-                response_text = result.final_output
+                # Run the agent with retry logic
+                response_text = self._run_agent_analysis(prompt)
 
                 # Parse the response
                 summary = ""
@@ -166,12 +196,28 @@ def analyze_changes(self, files_with_content: List[Dict[str, str]]) -> DiffAnaly
                     for dep in comp.get("dependencies", []):
                         # Try to find the dependency in other components
                         for other_comp in self.graph_manager.component_nodes.values():
-                            if other_comp.name == dep:
+                            # More flexible matching - check if the dependency name is contained in the component name
+                            # or if the component name is contained in the dependency name
+                            if (dep.lower() in other_comp.name.lower() or
+                                other_comp.name.lower() in dep.lower()):
                                 self.graph_manager.add_component_dependency(
                                     f"{current_file}::{comp['name']}",
                                     f"{other_comp.file_path}::{other_comp.name}"
                                 )
 
+                    # Add dependents
+                    for dep in comp.get("dependents", []):
+                        # Try to find the dependent in other components
+                        for other_comp in self.graph_manager.component_nodes.values():
+                            # More flexible matching - check if the dependent name is contained in the component name
+                            # or if the component name is contained in the dependent name
+                            if (dep.lower() in other_comp.name.lower() or
+                                other_comp.name.lower() in dep.lower()):
+                                self.graph_manager.add_component_dependency(
+                                    f"{other_comp.file_path}::{other_comp.name}",
+                                    f"{current_file}::{comp['name']}"
+                                )
+
                 # Mark file as processed
                 self.graph_manager.mark_processed(current_file, summary, components)
 

From f9dac4d9ca3ee2e4002564072e715dbe46347b9a Mon Sep 17 00:00:00 2001
From: Avikalp Kumar Gupta <avikalpgupta@gmail.com>
Date: Sun, 8 Jun 2025 15:15:35 -0400
Subject: [PATCH 2/7] Add roadmap for implementing the agentic flow for
 diffgraph creation; move all roadmap documents into the docs folder

---
 docs/Roadmap-v0-demo.md                     | 202 ++++++++++++++++++++
 Roadmap.md => docs/Roadmap-v0-initialize.md |   0
 2 files changed, 202 insertions(+)
 create mode 100644 docs/Roadmap-v0-demo.md
 rename Roadmap.md => docs/Roadmap-v0-initialize.md (100%)

diff --git a/docs/Roadmap-v0-demo.md b/docs/Roadmap-v0-demo.md
new file mode 100644
index 0000000..23ae2bf
--- /dev/null
+++ b/docs/Roadmap-v0-demo.md
@@ -0,0 +1,202 @@
+# 📅 Roadmap: Modular Multi-Agent Architecture for diffgraph-ai
+
+This roadmap introduces a modular re-architecture of `diffgraph-ai`, aimed at improving the accuracy, extensibility, and quality of visual diff representations. The goal is to break up the existing monolithic agent prompt into smaller, specialized AI agents using the OpenAI Agents SDK.
+
+Each step is:
+
+* ✅ Independently testable
+* 🔁 Minimal, logical step in the pipeline
+* 📗 Documented clearly enough for junior developers or AI assistants to follow
+
+---
+
+## ✅ Step 1: Introduce Component-Level Visualization
+
+### 🌟 Objective:
+
+Update the `GraphManager` and Mermaid generation to render function- and class-level nodes instead of only file-level nodes.
+
+### 🔹 Definition of Done:
+
+The output HTML graph should show component nodes (e.g., `validateUser()`, `AuthService`) with their change type (added/modified/deleted).
+
+### ⚡ Implementation Plan:
+
+* Update `GraphManager.add_component` to always record components
+* Modify `get_mermaid_diagram()` to include and render component-level nodes with styles
+* Use stub data if needed (before real extraction logic works)
+
+### 🔧 Implementation Details:
+
+* Use unique node IDs: `file_path::component_name`
+* Use the `ChangeType` color scheme already defined
+* Show 1–2 lines of the component summary (if available)
+* Link dependencies using edges (even hardcoded for now)
+
+### 📌 Status: `Not Started`
+
+---
+
+## ✅ Step 2: Split Agent Prompts into Two Specialized Roles
+
+### 🌟 Objective:
+
+Replace the monolithic analysis prompt with two focused prompts:
+
+1. **Component Extractor**
+2. **Dependency Mapper**
+
+### 🔹 Definition of Done:
+
+You should be able to call each of these prompts independently and get JSON output conforming to a shared schema.
+
+### ⚡ Implementation Plan:
+
+* Create prompt templates (can live as Python strings or YAML files)
+* Use `client.chat.completions.create` (the `openai>=1.0` replacement for the removed `openai.ChatCompletion.create`) to run each prompt manually first
+* Define a shared `Component` schema with:
+
+  * `name`, `type`, `summary`, `dependencies`, `dependents`, `file_path`, `change_type`
+
+### 🔧 Implementation Details:
+
+* Component Extractor receives: file path + content + change type
+* Dependency Mapper receives: file path + list of components + code snippets
+* Each tool returns JSON with a list of `Component` objects
+* Validate that outputs can round-trip through `pydantic.BaseModel`
+
+### 📌 Status: `Not Started`
+
+---
+
+## ✅ Step 3: Add Chunking System for Large Files
+
+### 🌟 Objective:
+
+Break large files into chunks so component extraction doesn’t fail due to context limits.
+
+### 🔹 Definition of Done:
+
+The system should:
+
+* Automatically detect long files (>1000 lines or >10KB)
+* Split by top-level class or function boundaries
+* Pass each chunk individually to the Extractor agent
+
+### ⚡ Implementation Plan:
+
+* Use `tree-sitter` or regex to identify safe split points
+* Assign each chunk a metadata block:
+
+  * `chunk_id`, `start_line`, `end_line`, `file_path`, `text`
+* Feed each chunk separately into agent and recombine component outputs
+
+### 🔧 Implementation Details:
+
+* Store `ChunkResult` structs with raw outputs + parsed `Component` list
+* Keep a map of chunk → original file for traceability
+* If any chunk fails, include fallback: "Chunk X could not be parsed."
+
+### 📌 Status: `Not Started`
+
+---
+
+## ✅ Step 4: Set Up OpenAI Agents SDK Planner and Tools
+
+### 🌟 Objective:
+
+Create an orchestrator agent using the OpenAI Agents SDK that delegates to tools:
+
+* `extract_components`
+* `map_dependencies`
+* `visualize_graph`
+
+### 🔹 Definition of Done:
+
+A single `Runner.run()` call should:
+
+* Take the file list
+* Call tools in correct order
+* Generate a final graph and return it
+
+### ⚡ Implementation Plan:
+
+* Define 3 `Tool` subclasses
+* Define their input/output JSON schemas
+* Register these tools inside a `Planner` agent
+
+### 🔧 Implementation Details:
+
+* Use the SDK's tool abstraction (the `function_tool` decorator / `FunctionTool` from the `agents` package; see [Tools](https://openai.github.io/openai-agents-python/tools/))
+* Each tool’s `call()` should be fully stateless and log input/output
+* Store intermediate results in a `Workspace` or memory dict
+* Use the built-in `Planner` or implement a `ToolPicker`
+
+### 📌 Status: `Not Started`
+
+---
+
+## ✅ Step 5: Refactor Agent-Calling Logic in `ai_analysis.py`
+
+### 🌟 Objective:
+
+Replace direct prompt + parsing logic with calls to the OpenAI Agents SDK planner + tools.
+
+### 🔹 Definition of Done:
+
+`CodeAnalysisAgent.analyze_changes()` should:
+
+* Initialize planner
+* Submit file info + diffs to planner
+* Collect final graph (or summary)
+
+### ⚡ Implementation Plan:
+
+* Replace `_run_agent_analysis` with SDK planner call
+* Move all hardcoded prompt strings into reusable tools
+* Add detailed logging so developers can trace step-by-step agent execution
+
+### 🔧 Implementation Details:
+
+* Prepare `ToolContext` or `ToolMemory` between agent steps if needed
+* Use JSON logs for prompt/output snapshots to aid debugging
+* Ensure fallback mode (manual single-agent) works with `--legacy` flag
+
+### 📌 Status: `Not Started`
+
+---
+
+## ✅ Step 6: Plan for Future Multi-LLM Abstraction
+
+### 🌟 Objective:
+
+Lay the foundation for future support of Anthropic, Perplexity, Google Gemini, and OSS models.
+
+### 🔹 Definition of Done:
+
+Abstract out all LLM calls behind an `LLMProvider` interface.
+
+### ⚡ Implementation Plan:
+
+* Create `providers/` module
+* Start with `OpenAIProvider` (wraps OpenAI SDK + Agents SDK)
+* Define common interface: `.chat()`, `.tool_call()`, `.get_capabilities()`
+
+### 🔧 Implementation Details:
+
+* Use Python `ABC` or `Protocol`
+* Later: add `AnthropicProvider`, `OllamaProvider`, etc.
+* Allow tool definitions to work with different backends based on config or CLI flag
+
+### 📌 Status: `Not Started`
+
+---
+
+## 🏁 Final Deliverables Checklist
+
+* [ ] Component-level Mermaid output
+* [ ] Modular tool + planner agent pipeline
+* [ ] Chunked file handling with metadata
+* [ ] JSON-based schemas and round-trippable outputs
+* [ ] SDK-based execution with full logging
+* [ ] Abstracted backend for future multi-LLM provider support
diff --git a/Roadmap.md b/docs/Roadmap-v0-initialize.md
similarity index 100%
rename from Roadmap.md
rename to docs/Roadmap-v0-initialize.md

From b2450a4c65b9d57b43a3934ec7212cb52c1e6895 Mon Sep 17 00:00:00 2001
From: Avikalp Kumar Gupta <avikalpgupta@gmail.com>
Date: Sun, 8 Jun 2025 15:20:15 -0400
Subject: [PATCH 3/7] Refactor Mermaid diagram generation in GraphManager

- Updated file and component node styling to use lighter and darker shades respectively for better visual distinction.
- Removed redundant color mapping and replaced it with direct class definitions for file and component changes in the Mermaid diagram.
- In the HTML report, the Mermaid diagram is now shown before the change summary.
---
 diffgraph/graph_manager.py | 38 +++++++++++++++-----------------------
 diffgraph/html_report.py   |  8 ++++----
 2 files changed, 19 insertions(+), 27 deletions(-)

diff --git a/diffgraph/graph_manager.py b/diffgraph/graph_manager.py
index f1628e7..bb9022f 100644
--- a/diffgraph/graph_manager.py
+++ b/diffgraph/graph_manager.py
@@ -144,46 +144,38 @@ def get_mermaid_diagram(self) -> str:
         """Generate a Mermaid diagram representation of the graph."""
         mermaid = ["graph TD"]
 
-        # Add file nodes with their change type colors
+        # Add file nodes with their change type colors (lighter shades)
         for file_path, node in self.file_nodes.items():
-            color = {
-                ChangeType.ADDED: "green",
-                ChangeType.DELETED: "red",
-                ChangeType.MODIFIED: "orange",
-                ChangeType.UNCHANGED: "gray"
-            }[node.change_type]
-
             label = f"{file_path}"
             if node.summary:
                 label += f"<br/>{node.summary[:50]}..."
             if node.error:
                 label += f"<br/>(Error: {node.error})"
 
-            mermaid.append(f'    {file_path.replace("/", "_")}["{label}"]:::change_{node.change_type.value}')
+            mermaid.append(f'    {file_path.replace("/", "_")}["{label}"]:::file_{node.change_type.value}')
 
-        # Add component nodes
+        # Add component nodes (darker shades)
         for component_id, node in self.component_nodes.items():
-            color = {
-                ChangeType.ADDED: "green",
-                ChangeType.DELETED: "red",
-                ChangeType.MODIFIED: "orange",
-                ChangeType.UNCHANGED: "gray"
-            }[node.change_type]
-
             label = f"{node.name}"
             if node.summary:
                 label += f"<br/>{node.summary[:50]}..."
 
-            mermaid.append(f'    {component_id.replace("/", "_").replace("::", "_")}["{label}"]:::change_{node.change_type.value}')
+            mermaid.append(f'    {component_id.replace("/", "_").replace("::", "_")}["{label}"]:::component_{node.change_type.value}')
 
         # Add edges between components
         for source, target in self.component_graph.edges():
             mermaid.append(f'    {source.replace("/", "_").replace("::", "_")} --> {target.replace("/", "_").replace("::", "_")}')
 
-        # Add style definitions
-        mermaid.append("    classDef change_added fill:green,stroke:#333,stroke-width:2px")
-        mermaid.append("    classDef change_deleted fill:red,stroke:#333,stroke-width:2px")
-        mermaid.append("    classDef change_modified fill:orange,stroke:#333,stroke-width:2px")
-        mermaid.append("    classDef change_unchanged fill:gray,stroke:#333,stroke-width:2px")
+        # Add style definitions for files (lighter shades)
+        mermaid.append("    classDef file_added fill:#90EE90,stroke:#333,stroke-width:2px")  # Light green
+        mermaid.append("    classDef file_deleted fill:#FFB6C1,stroke:#333,stroke-width:2px")  # Light red
+        mermaid.append("    classDef file_modified fill:#FFD580,stroke:#333,stroke-width:2px")  # Light orange
+        mermaid.append("    classDef file_unchanged fill:#D3D3D3,stroke:#333,stroke-width:2px")  # Light gray
+
+        # Add style definitions for components (darker shades)
+        mermaid.append("    classDef component_added fill:#32CD32,stroke:#333,stroke-width:2px")  # Lime green
+        mermaid.append("    classDef component_deleted fill:#DC143C,stroke:#333,stroke-width:2px")  # Crimson
+        mermaid.append("    classDef component_modified fill:#FF8C00,stroke:#333,stroke-width:2px")  # Dark orange
+        mermaid.append("    classDef component_unchanged fill:#808080,stroke:#333,stroke-width:2px")  # Gray
 
         return "\n".join(mermaid)
\ No newline at end of file
diff --git a/diffgraph/html_report.py b/diffgraph/html_report.py
index 2565473..5765024 100644
--- a/diffgraph/html_report.py
+++ b/diffgraph/html_report.py
@@ -147,6 +147,10 @@ def generate_html_report(analysis: AnalysisResult, output_path: str = "diffgraph
         <button class="theme-toggle" onclick="toggleTheme()">Toggle Dark Mode</button>
     </h1>
 
+    <div class="mermaid">
+        {mermaid_diagram}
+    </div>
+
     <div class="summary">
         <h2>Analysis Summary</h2>
         <div class="markdown-content" id="summary-content">
@@ -154,10 +158,6 @@ def generate_html_report(analysis: AnalysisResult, output_path: str = "diffgraph
         </div>
     </div>
 
-    <div class="mermaid">
-        {mermaid_diagram}
-    </div>
-
     <script>
         // Initialize Mermaid
         mermaid.initialize({{

From 83bff29ff985551f9f4cf6e33df98a68b74fcbb2 Mon Sep 17 00:00:00 2001
From: Avikalp Kumar Gupta <avikalpgupta@gmail.com>
Date: Sun, 8 Jun 2025 17:19:59 -0400
Subject: [PATCH 4/7] fix(diffgraph): Enhance CodeAnalysisAgent and
 GraphManager functionality

- Added regex-based parsing for component attributes in CodeAnalysisAgent to improve flexibility and robustness.
- Updated add_component method in GraphManager to handle summary, dependencies, and dependents more effectively, including cleanup of empty entries.
- Improved error handling during component processing to ensure invalid components are skipped without breaking the flow.
- Introduced tooltip functionality in HTML report for better user interaction with component nodes.
---
 diffgraph/ai_analysis.py   | 111 +++++++++++++++++++++----------------
 diffgraph/graph_manager.py |  76 ++++++++++++++++++-------
 diffgraph/html_report.py   |  57 +++++++++++++++++++
 3 files changed, 178 insertions(+), 66 deletions(-)

diff --git a/diffgraph/ai_analysis.py b/diffgraph/ai_analysis.py
index 3d028d0..8e900d7 100644
--- a/diffgraph/ai_analysis.py
+++ b/diffgraph/ai_analysis.py
@@ -6,6 +6,7 @@
 import time
 import random
 import openai
+import re
 
 class FileChange(BaseModel):
     """Model representing a file change."""
@@ -158,65 +159,81 @@ def analyze_changes(self, files_with_content: List[Dict[str, str]]) -> DiffAnaly
                 if "COMPONENTS:" in response_text:
                     components_section = response_text.split("COMPONENTS:")[1].split("IMPACT:")[0].strip()
                     current_component = {}
+                    components = []  # Reset components list for each file
 
                     for line in components_section.split("\n"):
                         line = line.strip()
                         if not line:
-                            if current_component:
+                            if current_component and "name" in current_component:  # Only add if we have a name
                                 components.append(current_component)
                                 current_component = {}
                             continue
 
-                        if line.startswith("- name:"):
-                            if current_component:
-                                components.append(current_component)
-                            current_component = {"name": line[7:].strip()}
-                        elif line.startswith("  type:"):
-                            current_component["type"] = line[7:].strip()
-                        elif line.startswith("  summary:"):
-                            current_component["summary"] = line[10:].strip()
-                        elif line.startswith("  dependencies:"):
-                            current_component["dependencies"] = [d.strip() for d in line[15:].split(",")]
-                        elif line.startswith("  dependents:"):
-                            current_component["dependents"] = [d.strip() for d in line[12:].split(",")]
-
-                    if current_component:
+                        parts = line.split(":")
+                        if len(parts) > 1:
+                            field_name = re.sub(r'[^a-zA-Z0-9_]', '', parts[0].strip()).lower()
+                            field_value = ":".join(parts[1:]).strip()
+                            if field_name == "name":
+                                if current_component and "name" in current_component:  # Only add if we have a name
+                                    components.append(current_component)
+                                current_component = {"name": field_value}
+                            elif field_name == "type":
+                                current_component["type"] = re.sub(r'[^a-zA-Z0-9_]', '', field_value.strip()).lower()
+                            elif field_name == "summary":
+                                current_component["summary"] = field_value
+                            elif field_name == "dependencies":
+                                current_component["dependencies"] = [d.strip() for d in field_value.split(",") if d.strip()]
+                            elif field_name == "dependents":
+                                current_component["dependents"] = [d.strip() for d in field_value.split(",") if d.strip()]
+
+                    if current_component and "name" in current_component:  # Only add if we have a name
                         components.append(current_component)
 
                 # Add components to the graph
                 for comp in components:
-                    change_type = ChangeType[comp["type"].upper()]
-                    self.graph_manager.add_component(
-                        comp["name"],
-                        current_file,
-                        change_type
-                    )
-
-                    # Add dependencies
-                    for dep in comp.get("dependencies", []):
-                        # Try to find the dependency in other components
-                        for other_comp in self.graph_manager.component_nodes.values():
-                            # More flexible matching - check if the dependency name is contained in the component name
-                            # or if the component name is contained in the dependency name
-                            if (dep.lower() in other_comp.name.lower() or
-                                other_comp.name.lower() in dep.lower()):
-                                self.graph_manager.add_component_dependency(
-                                    f"{current_file}::{comp['name']}",
-                                    f"{other_comp.file_path}::{other_comp.name}"
-                                )
-
-                    # Add dependents
-                    for dep in comp.get("dependents", []):
-                        # Try to find the dependent in other components
-                        for other_comp in self.graph_manager.component_nodes.values():
-                            # More flexible matching - check if the dependent name is contained in the component name
-                            # or if the component name is contained in the dependent name
-                            if (dep.lower() in other_comp.name.lower() or
-                                other_comp.name.lower() in dep.lower()):
-                                self.graph_manager.add_component_dependency(
-                                    f"{other_comp.file_path}::{other_comp.name}",
-                                    f"{current_file}::{comp['name']}"
-                                )
+                    if "name" not in comp or "type" not in comp:
+                        print(f"Skipping invalid component: {comp}")
+                        continue
+
+                    try:
+                        change_type = ChangeType[comp["type"].upper()]
+                        self.graph_manager.add_component(
+                            comp["name"],
+                            current_file,
+                            change_type,
+                            summary=comp.get("summary"),
+                            dependencies=comp.get("dependencies", []),
+                            dependents=comp.get("dependents", [])
+                        )
+
+                        # Add dependencies
+                        for dep in comp.get("dependencies", []):
+                            if not dep:  # Skip empty dependencies
+                                continue
+                            # Try to find the dependency in other components
+                            for other_comp in self.graph_manager.component_nodes.values():
+                                if (dep.lower() in other_comp.name.lower() or
+                                    other_comp.name.lower() in dep.lower()):
+                                    self.graph_manager.add_component_dependency(
+                                        f"{current_file}::{comp['name']}",
+                                        f"{other_comp.file_path}::{other_comp.name}"
+                                    )
+
+                        # Add dependents
+                        for dep in comp.get("dependents", []):
+                            if not dep:  # Skip empty dependents
+                                continue
+                            # Try to find the dependent in other components
+                            for other_comp in self.graph_manager.component_nodes.values():
+                                if (dep.lower() in other_comp.name.lower() or
+                                    other_comp.name.lower() in dep.lower()):
+                                    self.graph_manager.add_component_dependency(
+                                        f"{other_comp.file_path}::{other_comp.name}",
+                                        f"{current_file}::{comp['name']}"
+                                    )
+                    except Exception as e:
+                        print(f"Error processing component {comp.get('name', 'unknown')}: {str(e)}")
+                        continue
 
                 # Mark file as processed
                 self.graph_manager.mark_processed(current_file, summary, components)
diff --git a/diffgraph/graph_manager.py b/diffgraph/graph_manager.py
index bb9022f..cb72b02 100644
--- a/diffgraph/graph_manager.py
+++ b/diffgraph/graph_manager.py
@@ -70,23 +70,42 @@ def add_file(self, file_path: str, change_type: ChangeType) -> None:
             self.file_graph.add_node(file_path)
             self.processing_queue.append(file_path)
 
-    def add_component(self, name: str, file_path: str, change_type: ChangeType) -> None:
+    def add_component(self, name: str, file_path: str, change_type: ChangeType, summary: str = None, dependencies: list = None, dependents: list = None) -> None:
         """Add a new component to the graph."""
         component_id = f"{file_path}::{name}"
+        # Clean up dependencies and dependents lists
+        dependencies = [d for d in (dependencies or []) if d]
+        dependents = [d for d in (dependents or []) if d]
+
         if component_id not in self.component_nodes:
             self.component_nodes[component_id] = ComponentNode(
                 name=name,
                 file_path=file_path,
-                change_type=change_type
+                change_type=change_type,
+                summary=summary,
+                dependencies=dependencies,
+                dependents=dependents
             )
             self.component_graph.add_node(component_id)
+        else:
+            # Update existing component
+            existing = self.component_nodes[component_id]
+            existing.summary = summary or existing.summary
+            existing.dependencies = dependencies or existing.dependencies
+            existing.dependents = dependents or existing.dependents
 
     def add_component_dependency(self, source: str, target: str) -> None:
         """Add a dependency relationship between components."""
+        if not source or not target or source == target:
+            return
+
         if source in self.component_nodes and target in self.component_nodes:
-            self.component_graph.add_edge(source, target)
-            self.component_nodes[source].dependencies.append(target)
-            self.component_nodes[target].dependents.append(source)
+            if not self.component_graph.has_edge(source, target):
+                self.component_graph.add_edge(source, target)
+                if target not in self.component_nodes[source].dependencies:
+                    self.component_nodes[source].dependencies.append(target)
+                if source not in self.component_nodes[target].dependents:
+                    self.component_nodes[target].dependents.append(source)
 
     def get_next_file(self) -> Optional[str]:
         """Get the next file to process from the queue."""
@@ -144,23 +163,37 @@ def get_mermaid_diagram(self) -> str:
         """Generate a Mermaid diagram representation of the graph."""
         mermaid = ["graph TD"]
 
-        # Add file nodes with their change type colors (lighter shades)
-        for file_path, node in self.file_nodes.items():
-            label = f"{file_path}"
-            if node.summary:
-                label += f"<br/>{node.summary[:50]}..."
-            if node.error:
-                label += f"<br/>(Error: {node.error})"
+        file_classes = []
+        component_classes = []
 
-            mermaid.append(f'    {file_path.replace("/", "_")}["{label}"]:::file_{node.change_type.value}')
-
-        # Add component nodes (darker shades)
+        # Group components by their file paths
+        file_components = {}
         for component_id, node in self.component_nodes.items():
-            label = f"{node.name}"
-            if node.summary:
-                label += f"<br/>{node.summary[:50]}..."
+            if node.file_path not in file_components:
+                file_components[node.file_path] = []
+            file_components[node.file_path].append((component_id, node))
 
-            mermaid.append(f'    {component_id.replace("/", "_").replace("::", "_")}["{label}"]:::component_{node.change_type.value}')
+        # Add file nodes as subgraphs with their components inside
+        for file_path, node in self.file_nodes.items():
+            file_id = file_path.replace("/", "_")
+            file_label = file_path
+            if node.error:
+                file_label += f"<br/>(Error: {node.error})"
+            mermaid.append(f'    subgraph {file_id}["{file_label}"]')
+            mermaid.append(f'        direction TB')
+            file_classes.append(f'class {file_id} file_{node.change_type.value}')
+            # Add components within this file
+            if file_path in file_components:
+                for component_id, comp_node in file_components[file_path]:
+                    comp_id = component_id.replace("/", "_").replace("::", "_")
+                    component_label = comp_node.name
+                    if comp_node.summary:
+                        mermaid.append(f'        {comp_id}["{component_label}"]')
+                        component_classes.append(f'class {comp_id} component_{comp_node.change_type.value}')
+                    else:
+                        mermaid.append(f'        {comp_id}["{component_label}"]')
+                        component_classes.append(f'class {comp_id} component_{comp_node.change_type.value}')
+            mermaid.append('    end')
 
         # Add edges between components
         for source, target in self.component_graph.edges():
@@ -177,5 +210,10 @@ def get_mermaid_diagram(self) -> str:
         mermaid.append("    classDef component_deleted fill:#DC143C,stroke:#333,stroke-width:2px")  # Crimson
         mermaid.append("    classDef component_modified fill:#FF8C00,stroke:#333,stroke-width:2px")  # Dark orange
         mermaid.append("    classDef component_unchanged fill:#808080,stroke:#333,stroke-width:2px")  # Gray
+        mermaid.append("    classDef hidden fill:none,stroke:none")
+
+        # Add explicit class statements for files and components
+        mermaid.extend(file_classes)
+        mermaid.extend(component_classes)
 
         return "\n".join(mermaid)
\ No newline at end of file
diff --git a/diffgraph/html_report.py b/diffgraph/html_report.py
index 5765024..c68c20f 100644
--- a/diffgraph/html_report.py
+++ b/diffgraph/html_report.py
@@ -139,6 +139,24 @@ def generate_html_report(analysis: AnalysisResult, output_path: str = "diffgraph
             border-radius: 0.25rem;
             font-size: 0.875em;
         }}
+
+        /* Tooltip styles */
+        .tooltip {{
+            position: fixed;
+            background: var(--bg-secondary);
+            border: 1px solid var(--border-color);
+            border-radius: 0.5rem;
+            padding: 1rem;
+            max-width: 400px;
+            box-shadow: 0 4px 6px rgba(0, 0, 0, 0.1);
+            z-index: 1000;
+            display: none;
+            color: var(--text-primary);
+        }}
+
+        .tooltip.visible {{
+            display: block;
+        }}
     </style>
 </head>
 <body>
@@ -158,6 +176,9 @@ def generate_html_report(analysis: AnalysisResult, output_path: str = "diffgraph
         </div>
     </div>
 
+    <!-- Tooltip element -->
+    <div id="tooltip" class="tooltip"></div>
+
     <script>
         // Initialize Mermaid
         mermaid.initialize({{
@@ -202,6 +223,42 @@ def generate_html_report(analysis: AnalysisResult, output_path: str = "diffgraph
                 mermaid.init(undefined, el);
             }});
         }}
+
+        // Tooltip handling
+        window.showTooltip = function(text, event) {{
+            const tooltip = document.getElementById('tooltip');
+            tooltip.textContent = text;
+            tooltip.style.left = event.pageX + 10 + 'px';
+            tooltip.style.top = event.pageY + 10 + 'px';
+            tooltip.classList.add('visible');
+        }}
+
+        window.hideTooltip = function() {{
+            const tooltip = document.getElementById('tooltip');
+            tooltip.classList.remove('visible');
+        }}
+
+        // Add click handlers for component nodes
+        document.addEventListener('DOMContentLoaded', (event) => {{
+            document.querySelectorAll('.mermaid').forEach((el) => {{
+                el.addEventListener('click', (e) => {{
+                    const target = e.target;
+                    if (target.classList.contains('node')) {{
+                        const tooltip = target.getAttribute('data-tooltip');
+                        if (tooltip) {{
+                            showTooltip(tooltip, e);
+                        }}
+                    }}
+                }});
+            }});
+
+            // Hide tooltip when clicking outside
+            document.addEventListener('click', (e) => {{
+                if (!e.target.classList.contains('node')) {{
+                    hideTooltip();
+                }}
+            }});
+        }});
     </script>
 </body>
 </html>

From 47ae64d2dced0d8acb71ef1e26e87b298bb6ed87 Mon Sep 17 00:00:00 2001
From: Avikalp Kumar Gupta <avikalpgupta@gmail.com>
Date: Sun, 8 Jun 2025 19:17:22 -0400
Subject: [PATCH 5/7] refactor(diffgraph: graph_manager, html_report): Update
 Mermaid diagram generation and enhance tooltip functionality

- Changed Mermaid diagram orientation from TD to LR for better layout.
- Sanitized component IDs with a regex that replaces every character outside `[a-zA-Z0-9_]` with an underscore.
- Enhanced tooltip display in HTML report with markdown parsing and improved styling.
- Replaced the manual per-node click listeners with Mermaid `click ... call callback(...)` bindings, and used `closest('.node')` to decide when a click should hide the tooltip.
---
 diffgraph/graph_manager.py | 16 ++++++------
 diffgraph/html_report.py   | 53 ++++++++++++++++++++++----------------
 docs/Roadmap-v0-demo.md    |  6 ++---
 3 files changed, 42 insertions(+), 33 deletions(-)

diff --git a/diffgraph/graph_manager.py b/diffgraph/graph_manager.py
index cb72b02..5878427 100644
--- a/diffgraph/graph_manager.py
+++ b/diffgraph/graph_manager.py
@@ -2,6 +2,7 @@
 from dataclasses import dataclass
 from enum import Enum
 import networkx as nx
+import re
 
 class ChangeType(Enum):
     """Type of change in the code."""
@@ -161,7 +162,7 @@ def get_connected_components(self, start_component: str, max_depth: int = 3) ->
 
     def get_mermaid_diagram(self) -> str:
         """Generate a Mermaid diagram representation of the graph."""
-        mermaid = ["graph TD"]
+        mermaid = ["graph LR"]
 
         file_classes = []
         component_classes = []
@@ -185,19 +186,18 @@ def get_mermaid_diagram(self) -> str:
             # Add components within this file
             if file_path in file_components:
                 for component_id, comp_node in file_components[file_path]:
-                    comp_id = component_id.replace("/", "_").replace("::", "_")
-                    component_label = comp_node.name
+                    comp_id = re.sub(r'[^a-zA-Z0-9_]', '_', component_id)
+                    component_label = comp_node.name.replace('"', '\\"').replace('`', '\\`')
                     if comp_node.summary:
-                        mermaid.append(f'        {comp_id}["{component_label}"]')
-                        component_classes.append(f'class {comp_id} component_{comp_node.change_type.value}')
+                        mermaid.append(f'        {comp_id}["{component_label}"]:::component_{comp_node.change_type.value}')
+                        mermaid.append(f'        click {comp_id} call callback("{comp_node.summary.replace('"', '\\"')}") "{comp_node.summary.replace('"', '\\"')}"')
                     else:
-                        mermaid.append(f'        {comp_id}["{component_label}"]')
-                        component_classes.append(f'class {comp_id} component_{comp_node.change_type.value}')
+                        mermaid.append(f'        {comp_id}["{component_label}"]:::component_{comp_node.change_type.value}')
             mermaid.append('    end')
 
         # Add edges between components
         for source, target in self.component_graph.edges():
-            mermaid.append(f'    {source.replace("/", "_").replace("::", "_")} --> {target.replace("/", "_").replace("::", "_")}')
+            mermaid.append(f'    {re.sub(r'[^a-zA-Z0-9_]', '_', source)} --> {re.sub(r'[^a-zA-Z0-9_]', '_', target)}')
 
         # Add style definitions for files (lighter shades)
         mermaid.append("    classDef file_added fill:#90EE90,stroke:#333,stroke-width:2px")  # Light green
diff --git a/diffgraph/html_report.py b/diffgraph/html_report.py
index c68c20f..c0dc606 100644
--- a/diffgraph/html_report.py
+++ b/diffgraph/html_report.py
@@ -157,6 +157,21 @@ def generate_html_report(analysis: AnalysisResult, output_path: str = "diffgraph
         .tooltip.visible {{
             display: block;
         }}
+
+        .mermaidTooltip {{
+            position: absolute;
+            text-align: center;
+            max-width: 200px;
+            padding: 2px;
+            font-family: 'trebuchet ms', verdana, arial;
+            font-size: 12px;
+            background: #ffffde;
+            border: 1px solid #aaaa33;
+            border-radius: 2px;
+            pointer-events: none;
+            z-index: 100;
+        }}
+
     </style>
 </head>
 <body>
@@ -169,6 +184,8 @@ def generate_html_report(analysis: AnalysisResult, output_path: str = "diffgraph
         {mermaid_diagram}
     </div>
 
+    <div id="tooltip" class="tooltip"></div>
+
     <div class="summary">
         <h2>Analysis Summary</h2>
         <div class="markdown-content" id="summary-content">
@@ -176,9 +193,6 @@ def generate_html_report(analysis: AnalysisResult, output_path: str = "diffgraph
         </div>
     </div>
 
-    <!-- Tooltip element -->
-    <div id="tooltip" class="tooltip"></div>
-
     <script>
         // Initialize Mermaid
         mermaid.initialize({{
@@ -217,19 +231,21 @@ def generate_html_report(analysis: AnalysisResult, output_path: str = "diffgraph
             }});
 
             // Re-render Mermaid diagrams
-            document.querySelectorAll('.mermaid').forEach((el) => {{
+            document.querySelectorAll('.mermaid').forEach(async (el) => {{
                 const content = el.textContent;
                 el.textContent = content;
-                mermaid.init(undefined, el);
+                const {{ svg, bindFunctions }} = await mermaid.render('mermaid', content);
+                el.innerHTML = svg;
+                if (bindFunctions) {{
+                    bindFunctions(el);
+                }}
             }});
         }}
 
         // Tooltip handling
-        window.showTooltip = function(text, event) {{
+        window.showTooltip = function(text) {{
             const tooltip = document.getElementById('tooltip');
-            tooltip.textContent = text;
-            tooltip.style.left = event.pageX + 10 + 'px';
-            tooltip.style.top = event.pageY + 10 + 'px';
+            tooltip.innerHTML = marked.parse(text); // Parse markdown in tooltip
             tooltip.classList.add('visible');
         }}
 
@@ -238,23 +254,16 @@ def generate_html_report(analysis: AnalysisResult, output_path: str = "diffgraph
             tooltip.classList.remove('visible');
         }}
 
+        // Mermaid click callback
+        window.callback = function(text) {{
+            showTooltip(text);
+        }}
+
         // Add click handlers for component nodes
         document.addEventListener('DOMContentLoaded', (event) => {{
-            document.querySelectorAll('.mermaid').forEach((el) => {{
-                el.addEventListener('click', (e) => {{
-                    const target = e.target;
-                    if (target.classList.contains('node')) {{
-                        const tooltip = target.getAttribute('data-tooltip');
-                        if (tooltip) {{
-                            showTooltip(tooltip, e);
-                        }}
-                    }}
-                }});
-            }});
-
             // Hide tooltip when clicking outside
             document.addEventListener('click', (e) => {{
-                if (!e.target.classList.contains('node')) {{
+                if (!e.target.closest('.node')) {{
                     hideTooltip();
                 }}
             }});
diff --git a/docs/Roadmap-v0-demo.md b/docs/Roadmap-v0-demo.md
index 23ae2bf..5e0ffd9 100644
--- a/docs/Roadmap-v0-demo.md
+++ b/docs/Roadmap-v0-demo.md
@@ -33,7 +33,7 @@ The output HTML graph should show component nodes (e.g., `validateUser()`, `Auth
 * Show 1–2 lines of the component summary (if available)
 * Link dependencies using edges (even hardcoded for now)
 
-### 📌 Status: `Not Started`
+### 📌 Status: `Completed`
 
 ---
 
@@ -73,7 +73,7 @@ You should be able to call each of these prompts independently and get JSON outp
 
 ### 🌟 Objective:
 
-Break large files into chunks so component extraction doesn’t fail due to context limits.
+Break large files into chunks so component extraction doesn't fail due to context limits.
 
 ### 🔹 Definition of Done:
 
@@ -128,7 +128,7 @@ A single `Runner.run()` call should:
 ### 🔧 Implementation Details:
 
 * Use [`openai_agents.Tool`](https://openai.github.io/openai-agents-python/agents/#tools) class
-* Each tool’s `call()` should be fully stateless and log input/output
+* Each tool's `call()` should be fully stateless and log input/output
 * Store intermediate results in a `Workspace` or memory dict
 * Use the built-in `Planner` or implement a `ToolPicker`
 

From 78aeb6a6d3ce6b18707975e27d8a63a84e3e7ae4 Mon Sep 17 00:00:00 2001
From: Avikalp Kumar Gupta <avikalpgupta@gmail.com>
Date: Tue, 10 Jun 2025 14:48:02 -0400
Subject: [PATCH 6/7] Enhance exponential backoff retry logic in API calls

- Updated the retry decorator to wait for the 'retry_after' value exposed by the rate-limit error, when one is present.
- Fall back to exponential backoff with jitter when 'retry_after' is missing or cannot be parsed as a number.
- Added print statements to log response details during agent analysis execution for better debugging.
---
 diffgraph/ai_analysis.py | 20 +++++++++++++++++---
 1 file changed, 17 insertions(+), 3 deletions(-)

diff --git a/diffgraph/ai_analysis.py b/diffgraph/ai_analysis.py
index 8e900d7..c47ce16 100644
--- a/diffgraph/ai_analysis.py
+++ b/diffgraph/ai_analysis.py
@@ -20,7 +20,7 @@ class DiffAnalysis(BaseModel):
     mermaid_diagram: str
 
 def exponential_backoff_retry(func):
-    """Decorator to implement exponential backoff retry logic."""
+    """Decorator to implement exponential backoff retry logic using API rate limit information."""
     def wrapper(*args, **kwargs):
         max_retries = 5
         base_delay = 1  # Start with 1 second
@@ -33,8 +33,19 @@ def wrapper(*args, **kwargs):
                 if attempt == max_retries - 1:  # Last attempt
                     raise  # Re-raise the exception if all retries failed
 
-                # Calculate delay with exponential backoff and jitter
-                delay = min(base_delay * (2 ** attempt) + random.uniform(0, 1), max_delay)
+                # Try to get the retry delay from the error response
+                try:
+                    # Use the exception's 'retry_after' attribute if it exposes one (not guaranteed)
+                    retry_after = getattr(e, 'retry_after', None)
+                    if retry_after:
+                        delay = float(retry_after)
+                    else:
+                        # Fallback to exponential backoff if retry_after is not available
+                        delay = min(base_delay * (2 ** attempt) + random.uniform(0, 1), max_delay)
+                except (ValueError, TypeError):
+                    # If we can't parse the retry_after, fallback to exponential backoff
+                    delay = min(base_delay * (2 ** attempt) + random.uniform(0, 1), max_delay)
+
                 print(f"Rate limit hit. Retrying in {delay:.2f} seconds...")
                 time.sleep(delay)
             except Exception as e:
@@ -149,6 +160,9 @@ def analyze_changes(self, files_with_content: List[Dict[str, str]]) -> DiffAnaly
                 # Run the agent with retry logic
                 response_text = self._run_agent_analysis(prompt)
 
+                print("--------------------------------")
+                print(response_text)
+                print("--------------------------------")
                 # Parse the response
                 summary = ""
                 components = []

From c7f38de1d358bdeed8104ff3714a0a493bf483a1 Mon Sep 17 00:00:00 2001
From: Avikalp Kumar Gupta <avikalpgupta@gmail.com>
Date: Mon, 4 Aug 2025 18:32:56 +0530
Subject: [PATCH 7/7] minor: fixes suggested by CodeRabbit for improved
 reliability

- Updated graph_manager to JSON-encode component summaries (`json.dumps`) before embedding them in Mermaid click callbacks, so quotes and other special characters are escaped.
- Moved the regex-based ID sanitization for graph edges out of the f-string into local variables; the generated output is unchanged.
- Modified html_report to ensure unique rendering IDs for Mermaid diagrams, preventing conflicts during re-rendering.
---
 diffgraph/graph_manager.py | 9 ++++++---
 diffgraph/html_report.py   | 5 +++--
 2 files changed, 9 insertions(+), 5 deletions(-)

diff --git a/diffgraph/graph_manager.py b/diffgraph/graph_manager.py
index 5878427..f51e799 100644
--- a/diffgraph/graph_manager.py
+++ b/diffgraph/graph_manager.py
@@ -2,7 +2,7 @@
 from dataclasses import dataclass
 from enum import Enum
 import networkx as nx
-import re
+import json, re
 
 class ChangeType(Enum):
     """Type of change in the code."""
@@ -189,15 +189,18 @@ def get_mermaid_diagram(self) -> str:
                     comp_id = re.sub(r'[^a-zA-Z0-9_]', '_', component_id)
                     component_label = comp_node.name.replace('"', '\\"').replace('`', '\\`')
                     if comp_node.summary:
+                        summary_txt = json.dumps(comp_node.summary)
                         mermaid.append(f'        {comp_id}["{component_label}"]:::component_{comp_node.change_type.value}')
-                        mermaid.append(f'        click {comp_id} call callback("{comp_node.summary.replace('"', '\\"')}") "{comp_node.summary.replace('"', '\\"')}"')
+                        mermaid.append(f'        click {comp_id} call callback("{summary_txt}") "{summary_txt}"')
                     else:
                         mermaid.append(f'        {comp_id}["{component_label}"]:::component_{comp_node.change_type.value}')
             mermaid.append('    end')
 
         # Add edges between components
         for source, target in self.component_graph.edges():
-            mermaid.append(f'    {re.sub(r'[^a-zA-Z0-9_]', '_', source)} --> {re.sub(r'[^a-zA-Z0-9_]', '_', target)}')
+            src_id = re.sub(r'[^a-zA-Z0-9_]', '_', source)
+            tgt_id = re.sub(r'[^a-zA-Z0-9_]', '_', target)
+            mermaid.append(f'    {src_id} --> {tgt_id}')
 
         # Add style definitions for files (lighter shades)
         mermaid.append("    classDef file_added fill:#90EE90,stroke:#333,stroke-width:2px")  # Light green
diff --git a/diffgraph/html_report.py b/diffgraph/html_report.py
index c0dc606..d619cd4 100644
--- a/diffgraph/html_report.py
+++ b/diffgraph/html_report.py
@@ -231,10 +231,11 @@ def generate_html_report(analysis: AnalysisResult, output_path: str = "diffgraph
             }});
 
             // Re-render Mermaid diagrams
-            document.querySelectorAll('.mermaid').forEach(async (el) => {{
+            document.querySelectorAll('.mermaid').forEach(async (el, idx) => {{
                 const content = el.textContent;
                 el.textContent = content;
-                const {{ svg, bindFunctions }} = await mermaid.render('mermaid', content);
+                const renderId = `mermaid-${idx}`;
+                const {{ svg, bindFunctions }} = await mermaid.render(renderId, content);
                 el.innerHTML = svg;
                 if (bindFunctions) {{
                     bindFunctions(el);