In [65]:
from langgraph.graph import StateGraph
from langgraph.graph import START,END
from typing import TypedDict,Annotated,List
from operator  import add
from pydantic import BaseModel,Field
import uuid

from langchain.chat_models import init_chat_model
# Chat model shared by the rest of the notebook (wrapped for structured output further down).
# NOTE(review): presumably needs Google GenAI credentials available in the environment — confirm.
model=init_chat_model("google_genai:models/gemini-flash-latest")


In [66]:
class Checkpoint(TypedDict):
    """One learning checkpoint as stored in the graph state.

    Keys:
        id: Identifier string for the checkpoint.
        name: Name of the checkpoint.
        objective: Objective of the checkpoint.
    """

    id: str
    name: str
    objective: str

In [67]:


class State(TypedDict):
    """State schema handed to ``StateGraph``.

    Keys:
        report: Report text; read by the ``generate`` node.
        checkpoints: List of ``Checkpoint`` dicts.
    """

    report: str
    checkpoints: list[Checkpoint]

# Structured-output schema for a single checkpoint returned by the model.
# It has no `id` field; `generate` adds one after `model_dump()`.
# Documented with comments rather than a class docstring on purpose: pydantic
# copies a class docstring into the JSON schema, which would change what the
# model receives.
class CheckpointItem(BaseModel):
    name: str = Field(
        description="The name of the checkpoint",
    )
    objective: str = Field(
        description="the specific objective of the checkpoint",
    )

# Top-level structured-output schema: the list of checkpoint items the model
# is asked to return. Passed to `model.with_structured_output(...)`.
# Comments are used instead of a class docstring so the JSON schema sent to the
# model stays unchanged.
class CheckpointResponse(BaseModel):
    checkpoints: List[CheckpointItem]

# Model variant configured with the CheckpointResponse schema; `generate` reads
# `.checkpoints` from the object its invoke() returns.
model_with_structured_output=model.with_structured_output(CheckpointResponse)

In [68]:
def generate(state:State) -> dict:
    """Graph node: break the report in ``state`` into learning checkpoints.

    Sends the report text to ``model_with_structured_output`` and converts each
    returned item into a plain dict with a freshly generated UUID under ``id``.

    Args:
        state: Current graph state; only ``state['report']`` is read.

    Returns:
        A partial state update ``{"checkpoints": [...]}`` where each element is
        a dict with the keys ``name``, ``objective`` and ``id``.
    """
    report = state['report']
    # Keep the report clearly separated from the instruction so its first and
    # last words do not run into the surrounding prompt text.
    prompt = (
        "Extract and break down the following report into learning checkpoints.\n\n"
        f"Report:\n{report}"
    )
    response = model_with_structured_output.invoke(prompt)
    clean_checkpoints = [
        {**item.model_dump(), "id": str(uuid.uuid4())}
        for item in response.checkpoints
    ]
    # The key must match the `checkpoints` field declared on State; the former
    # "checkpoint" key did not correspond to any state field.
    return {"checkpoints": clean_checkpoints}

In [69]:
# Build a single-node graph over State: START -> "generate" -> END.
builder=StateGraph(State)

# Register the `generate` function under the node name "generate".
builder.add_node("generate",generate)

# Wire the only path through the graph.
builder.add_edge(START,"generate")
builder.add_edge("generate",END)
# Compiled graph object; invoked with an initial state dict in the next cell.
graph=builder.compile()

In [70]:
# NOTE(review): `report_var` is assigned in a later cell (In [72]) than this one (In [70]).
# On a fresh kernel this call raises NameError unless that cell is run first;
# move the `report_var` definition above this cell so Restart & Run All works.
graph.invoke({"report":report_var})

{'report': " \n\n Here is the final report: # Comprehensive Comparison: Google Gemini vs. OpenAI Deep Research Agents (2025)      │\n│                                                                                                                 │\n│ ## Introduction                                                                                                 │\n│                                                                                                                 │\n│ This report provides a detailed, balanced comparison of Google’s Gemini AI suite and OpenAI’s Deep Research     │\n│ agents. Both technologies represent state-of-the-art advancements in artificial intelligence but are designed   │\n│ with distinct architectures, capabilities, use cases, and integration models. This analysis examines key        │\n│ aspects such as core features, intended applications, underlying technologies, performance benchmarks,          │\n│ integration options, and notable strengths and

In [72]:
report_var=""" 

 Here is the final report: # Comprehensive Comparison: Google Gemini vs. OpenAI Deep Research Agents (2025)      │
│                                                                                                                 │
│ ## Introduction                                                                                                 │
│                                                                                                                 │
│ This report provides a detailed, balanced comparison of Google’s Gemini AI suite and OpenAI’s Deep Research     │
│ agents. Both technologies represent state-of-the-art advancements in artificial intelligence but are designed   │
│ with distinct architectures, capabilities, use cases, and integration models. This analysis examines key        │
│ aspects such as core features, intended applications, underlying technologies, performance benchmarks,          │
│ integration options, and notable strengths and weaknesses, referencing the latest information and official      │
│ documentation as of August 2025.                                                                                │
│                                                                                                                 │
│ ---                                                                                                             │
│                                                                                                                 │
│ ## Overview: Google Gemini                                                                                      │
│                                                                                                                 │
│ ### Core Capabilities                                                                                           │
│                                                                                                                 │
│ - **Multimodality**: Gemini supports native processing of text, images, video, audio, code, and PDF inputs, and │
│ can generate outputs in text, audio, and structured data formats. Recent iterations, such as Gemini 2.5 Deep    │
│ Think, can handle context windows exceeding 1 million tokens and output up to 192,000 tokens, enabling the      │
│ processing of vast and complex documents or media streams.                                                      │
│ - **Advanced Reasoning**: The “Deep Think” and Pro variants deploy parallel hypothesis testing and              │
│ reinforcement learning, excelling at coding, complex mathematical reasoning, multimodal understanding,          │
│ structured outputs, and function/tool calling.                                                                  │
│ - **Agentic Capabilities**: Gemini powers research agents and universal AI assistants (e.g., Project Astra,     │
│ Project Mariner), handling autonomous workflows like code debugging, real-time information retrieval, and       │
│ interactive web task completion.                                                                                │
│ - **Safety and Governance**: Gemini employs extensive safety measures, including red teaming (automated and     │
│ external), multi-tiered abuse monitoring, mitigations against sensitive domains (e.g., chemical/biological),    │
│ and oversight by Google DeepMind’s Responsibility and Safety Council. It adheres to ethical principles such as  │
│ minimization of bias and toxicity.                                                                              │
│                                                                                                                 │
│ ### Intended Use Cases                                                                                          │
│                                                                                                                 │
│ - Complex knowledge work (e.g., scientific research, coding assistants, market analysis)                        │
│ - Large-scale document analysis, summarization, and synthesis                                                   │
│ - Content creation across text, image, video (e.g., AI-powered design, video generation with Veo, music with    │
│ Lyria)                                                                                                          │
│ - Autonomous agents for enterprise workflows (e.g., web research, spreadsheet automation, technical support,    │
│ creative design)                                                                                                │
│ - Integration into Google products and services: Workspace (Docs, Sheets, Slides), Pixel devices, Search, Ads,  │
│ Chrome, and Duet AI                                                                                             │
│                                                                                                                 │
│ ### Underlying Technologies and Architecture                                                                    │
│                                                                                                                 │
│ - **Sparse Mixture-of-Experts (MoE) Transformers**: Efficiently routes token streams to specialist “experts,”   │
│ scaling model power and reducing unnecessary computation compared to dense models.                              │
│ - **Training Infrastructure**: Built and scaled atop Google’s custom Tensor Processing Units (TPUs), notably    │
│ the latest Trillium and v5p generations, offering high energy efficiency and throughput.                        │
│ - **Data and Multimodal Alignment**: Gemini models are instruction-tuned on diverse datasets spanning internet  │
│ text, code, multimodal data, and human tool-use demonstrations, with additional reinforcement from human and AI │
│ feedback loops.                                                                                                 │
│ - **Agentic Systems**: Gemini integrates tool use (code execution, search), rapid context expansion (handling   │
│ very large documents), and interaction with third-party tools through its APIs.                                 │
│                                                                                                                 │
│ ### Performance Benchmarks                                                                                      │
│                                                                                                                 │
│ - **Academic and Coding Tasks**:                                                                                │
│   - Outperformed humans on MMLU (90.0% - Gemini Ultra) and competes at IMO (mathematics competition) Bronze     │
│ level (60.7%).                                                                                                  │
│   - Achieves strong results on coding (LiveCodeBench 87.6%), knowledge, and reasoning benchmarks.               │
│ - **Agentic Tasks**:                                                                                            │
│   - Project Mariner and Gemini Plays Pokémon showcase advanced planning, tool use, and context management,      │
│ e.g., completing Pokémon Blue autonomously after hundreds of hours.                                             │
│ - **Comparative Edge**:                                                                                         │
│   - Gemini is recognized for high factual accuracy, extremely large context windows, and rapid processing,      │
│ especially for multimodal or large-scale tasks.                                                                 │
│                                                                                                                 │
│ ### Integration Options                                                                                         │
│                                                                                                                 │
│ - **APIs**: Accessible via Google AI Studio, Vertex AI (for cloud deployment), and dedicated APIs (REST, SDKs   │
│ in various languages).                                                                                          │
│ - **Product Deep Integration**: Gemini is foundational to Workspace tools, Pixel on-device AI, Search Labs' AI  │
│ Overviews, and Duet AI for enterprise productivity.                                                             │
│ - **Developer Ecosystem**: Offers Model Garden for testing/deployment, detailed rate limits with scalable       │
│ quotas, batch mode support for cost efficiency, and transparent, usage-based pricing.                           │
│ - **Fine-tuning & Customization**: Support for model customization and domain-specific tasks, with facilities   │
│ for prompt engineering, tool chaining, and safe deployment monitoring.                                          │
│                                                                                                                 │
│ ### Notable Strengths and Weaknesses                                                                            │
│                                                                                                                 │
│ **Strengths**                                                                                                   │
│ - Broad and deep multimodality with vast context (1M+ tokens)                                                   │
│ - High-speed inference for large, complex workflows                                                             │
│ - Deep integration across Google’s ecosystem and developer tools                                                │
│ - Industry-leading benchmarking on factual, reasoning, and coding tasks                                         │
│ - Advanced safety governance                                                                                    │
│                                                                                                                 │
│ **Weaknesses**                                                                                                  │
│ - Some known issues with hallucination and occasional latency, particularly at the highest computation tiers    │
│ - Over-refusal of benign queries due to conservative safety layers                                              │
│ - Earlier access to specialized features (e.g., newest model variants) may be gated or subject to usage         │
│ restrictions                                                                                                    │
│ - Premium enterprise pricing for advanced models and batch processing                                           │
│                                                                                                                 │
│ [1][2][3][4][5][6][7][8][9][10][11][12]                                                                         │
│                                                                                                                 │
│ ---                                                                                                             │
│                                                                                                                 │
│ ## Overview: OpenAI Deep Research Agents                                                                        │
│                                                                                                                 │
│ ### Core Capabilities                                                                                           │
│                                                                                                                 │
│ - **Autonomous Multi-Step Research**: Deep Research agents can independently plan, browse the real-time         │
│ internet, analyze hundreds of resources (websites, PDFs, images, structured files), synthesize findings, and    │
│ generate comprehensive, citation-backed research reports. Transparency is emphasized through step-by-step       │
│ action logs and in-line source attribution.                                                                     │
│ - **Agentic Reasoning & Workflow Automation**: Empowers users to delegate entire research projects, from web    │
│ data collection to report writing, planning, and visualization. The newly launched ChatGPT Agent combines these │
│ capabilities with code execution, web automation, and third-party tool integration (e.g., creating              │
│ presentations or spreadsheets).                                                                                 │
│ - **Citations & Analytical Traceability**: For every decisive step, Deep Research logs tools invoked (web       │
│ search, code interpreters, Model Context Protocol connectors), building a traceable reasoning chain akin to an  │
│ expert analyst’s workflow.                                                                                      │
│ - **Safety & User Control**: Implements explicit user approval for consequential actions, privacy/sandboxing    │
│ for sensitive tasks, and comprehensive risk mitigations, including prompt-injection and data exfiltration       │
│ defenses.                                                                                                       │
│                                                                                                                 │
│ ### Intended Use Cases                                                                                          │
│                                                                                                                 │
│ - In-depth market, policy, technical, or literature research requiring source-backed synthesis                  │
│ - Competitive intelligence, product comparison, and strategy reports                                            │
│ - Automated health economics analysis, regulatory compliance checks, and legal research                         │
│ - Spreadsheet automation, technical reporting, real-time trend and news aggregation                             │
│ - Enterprise integrations (Gmail, GitHub, financial modeling) and advanced agentic workflows                    │
│                                                                                                                 │
│ ### Underlying Technologies and Architecture                                                                    │
│                                                                                                                 │
│ - **Large-scale Reasoning Models**: Deep Research leverages optimized variants of OpenAI’s o3 and forthcoming   │
│ o4 models, which are highly agentic, employing transformer backbones enhanced by real-world tool-use learning   │
│ and advanced browsing capabilities.                                                                             │
│ - **Reinforcement Learning on Real Tasks**: Trained through reinforcement learning on real                      │
│ browser/Python/coding tasks, with extensive multi-modal alignment and reasoning fine-tuning.                    │
│ - **API Design**: Exposes research as an asynchronous background job, returning final structured reports with   │
│ detailed logs; supports tool integrations (web search, code interpreter, Model Context Protocol servers for     │
│ internal data research).                                                                                        │
│ - **Privacy and Safety by Design**: Restricts certain actions, logs all tool usage, requires trusted            │
│ connectors, and enforces separation of sensitive data workflows.                                                │
│                                                                                                                 │
│ ### Performance Benchmarks                                                                                      │
│                                                                                                                 │
│ - **Academic and Research Benchmarks**:                                                                         │
│   - State-of-the-art on Humanity’s Last Exam (26.6% - o3; new pass@1 of 41.6 for unified ChatGPT agent) and     │
│ GAIA (average accuracy of 72.6%).                                                                               │
│   - Well-suited for complex, multi-modal queries requiring synthesis across external and internal data.         │
│ - **Analyst-Level Workflows**:                                                                                  │
│   - Domain experts consistently rate Deep Research as automating multiple hours of challenging research per     │
│ successful query.                                                                                               │
│ - **Comparative Findings**:                                                                                     │
│   - Outperforms competitors (e.g., Gemini, DeepSeek, Perplexity) on multi-step analytic depth, citation         │
│ adherence, and complex chain-of-thought queries, albeit at higher cost and slower speeds.                       │
│                                                                                                                 │
│ ### Integration Options                                                                                         │
│                                                                                                                 │
│ - **ChatGPT Interface**: Accessible through ChatGPT’s web and desktop/mobile apps by selecting “Deep Research”  │
│ in message composition.                                                                                         │
│ - **API (Responses/Deep Research API)**: For developers, supports advanced integrations, automation, and tool   │
│ chaining, including the specification of custom data connectors and prompt rewriters.                           │
│ - **Connectors & Third-Party Apps**: Proactive workflow automation via connectors to Gmail, GitHub, and         │
│ enterprise suites, with sandboxed and permissioned real-world actions via the ChatGPT Agent.                    │
│ - **Pricing & Rate Limits**: Currently available to Pro, Plus, Team, and Enterprise users, with expansion to    │
│ the Free tier planned. The service is compute-intensive and billed at a premium (approx. $200/month), with      │
│ lower-latency variants and higher rate limits in development.                                                   │
│                                                                                                                 │
│ ### Notable Strengths and Weaknesses                                                                            │
│                                                                                                                 │
│ **Strengths**                                                                                                   │
│ - Highest depth for source-rich, well-cited analytic research                                                   │
│ - Iterative refinement and “human assistant” transparency in reasoning and decision logging                     │
│ - Unified agentic system bridges complex research, web automation, and coding actions                           │
│ - Robust safety (control over actions, explicit approvals, privacy isolation)                                   │
│ - Broad integration, especially for knowledge-intensive and enterprise research tasks                           │
│                                                                                                                 │
│ **Weaknesses**                                                                                                  │
│ - Processing time per research job (5–30 minutes) is substantially higher than general-purpose LLM outputs      │
│ - Cost is significantly higher than competitors for in-depth research                                           │
│ - Occasional hallucinations, confidence calibration issues, and variable output formatting                      │
│ - Research is most effective with fully-specified, well-formed prompts (API expects little to no clarification) │
│                                                                                                                 │
│ [1][2][3][5][6][7][8]                                                                                           │
│                                                                                                                 │
│ ---                                                                                                             │
│                                                                                                                 │
│ ## Comparative Analysis                                                                                         │
│                                                                                                                 │
│ ### Core Capabilities and Use Case Specialization                                                               │
│                                                                                                                 │
│ - **Gemini** excels as a general-purpose multimodal platform, rapidly handling diverse inputs (including        │
│ extremely long texts, images, video, and audio) with strong reasoning and large context support. Its agentic    │
│ variants (2.5 Deep Think) enable advanced planning and autonomy in complex workflows.                           │
│ - **Deep Research** is focused on deep, source-cited analytic synthesis—essentially automating the high-end     │
│ research analyst’s workflow with maximal coverage, transparency, and reasoning traceability. Its agentic        │
│ strengths shine in chaining multi-step queries, executing code, and integrating findings across disparate       │
│ domains.                                                                                                        │
│                                                                                                                 │
│ ### Architecture and Model Design                                                                               │
│                                                                                                                 │
│ - **Gemini** is built on sparse Mixture-of-Experts architecture for scalability and efficiency, and is natively │
│ multimodal from the ground up. It is deeply embedded in Google’s infrastructure (TPUs, Workspace, Pixel).       │
│ - **Deep Research** layers agentic reasoning atop advanced transformer backbones (optimized o3/o4), employs     │
│ reinforcement learning on tool-use tasks, and exposes fine-grained control and visibility via OpenAI’s API.     │
│                                                                                                                 │
│ ### Performance and Benchmarking                                                                                │
│                                                                                                                 │
│ - **Gemini** has benchmark leadership in large context, speed, and multimodal deployments (e.g., hours of       │
│ video, complex coding, factual QA), and generally edges out competitors for tasks blending modality and context │
│ length.                                                                                                         │
│ - **Deep Research** leads on traditional research metrics—multi-step logical synthesis, depth of citation, and  │
│ analyst-level report creation—as reflected in domain expert evaluations and results on reasoning-heavy          │
│ benchmarks (Humanity’s Last Exam, GAIA).                                                                        │
│ - **Caveat on Benchmarks**: Both Google and OpenAI acknowledge the limitations of current benchmarks, with      │
│ issues around dataset validity, saturation, and safety signaling. Users should regard reported scores as        │
│ indicative but not absolute measures of real-world performance ([9]).                                           │
│                                                                                                                 │
│ ### Integration and Ecosystem                                                                                   │
│                                                                                                                 │
│ - **Gemini** is highly accessible for developers and enterprises, offering mature APIs, Workspace integrations, │
│ and ready deployment via Vertex AI with transparent pricing and extensive documentation. It supports            │
│ fine-tuning, customization, and flexible deployment models (cloud, on-device).                                  │
│ - **Deep Research** is primarily available in ChatGPT and as an API for advanced developer use. Its workflow    │
│ capabilities are exposed via OpenAI's agent platform (ChatGPT Agent) and connectors, focusing on                │
│ knowledge-intensive enterprise environments and technical research.                                             │
│                                                                                                                 │
│ ### Cost, Access, and Scalability                                                                               │
│                                                                                                                 │
│ - **Gemini** offers broader cost tiers (including accessible entry points and enterprise pricing) and generous  │
│ free/developer access for basic use. Batch processing and context caching are available at reduced rates for    │
│ large-volume research.                                                                                          │
│ - **Deep Research** is positioned as a premium solution, with higher per-query costs and longer compute times.  │
│ Rollout to broader user tiers and cost-optimized models is in progress.                                         │
│                                                                                                                 │
│ ### Strengths and Weaknesses Overview                                                                           │
│                                                                                                                 │
│ |                  | Google Gemini                                         | OpenAI Deep Research               │
│ |                                                                                                               │
│ |------------------|------------------------------------------------------|------------------------------------ │
│ ------|                                                                                                         │
│ | **Strengths**    | - Largest context, multimodal integration<br>- Speed, deep Google product integration<br>- │
│ Strong factual accuracy and enterprise scalability<br>- Comprehensive safety governance | - Unmatched depth in  │
│ citation-rich, analytic synthesis<br>- Transparent, step-wise reasoning & action logs<br>- Agentic research     │
│ merges web/data/code tools<br>- Enterprise/analyst automation excellence     |                                  │
│ | **Weaknesses**   | - Occasional slowdowns at scale<br>- Over-refusal conservatism <br>- Some feature          │
│ gating<br>- Top-tier pricing for advanced models | - High cost, slow processing per job<br>-                    │
│ Hallucinations/confidence issues<br>- Prompts must be highly specific<br>- Format/UX issues in some outputs     │
│ |                                                                                                               │
│                                                                                                                 │
│ ---                                                                                                             │
│                                                                                                                 │
│ ## Conclusion                                                                                                   │
│                                                                                                                 │
│ Google Gemini and OpenAI’s Deep Research agents, while both representing the cutting edge of AI, are tailored   │
│ to different segments of the knowledge-work and agent automation spectrum:                                      │
│                                                                                                                 │
│ - **Use Gemini** if you require fast, scalable, multimodal reasoning and content generation, integration with   │
│ Google’s suite of tools, support for massive context windows, and broad developer deployment.                   │
│ - **Use Deep Research** when you need the highest level of analytic synthesis, traceability, and source-backed  │
│ reporting—essential for research analysts, legal/technical experts, and enterprises that require auditable,     │
│ multi-step automation and actionability.                                                                        │
│                                                                                                                 │
│ Both platforms are converging towards more capable agentic AI, integrating multi-step reasoning, workflow       │
│ automation, and external tool use. User choice should be guided by the project’s required depth, speed,         │
│ modality, integration needs, and budget constraints.                                                            │
│                                                                                                                 │
│ ---                                                                                                             │
│                                                                                                                 │
│ ## Sources                                                                                                      │
│                                                                                                                 │
│ 1. [Gemini models | Gemini API | Google AI for Developers](https://ai.google.dev/gemini-api/docs/models)        │
│ 2. [Introducing Gemini: our largest and most capable AI                                                         │
│ model](https://blog.google/technology/ai/google-gemini-ai/)                                                     │
│ 3. [Google models | Generative AI on Vertex AI](https://cloud.google.com/vertex-ai/generative-ai/docs/models)   │
│ 4. [Gemini 2.5 Deep Think - Model Card -                                                                        │
│ Googleapis.com](https://storage.googleapis.com/deepmind-media/Model-Cards/Gemini-2-5-Deep-Think-Model-Card.pdf) │
│ 5. [Introducing Gemini 2.0: our new AI model for the agentic                                                    │
│ era](https://blog.google/technology/google-deepmind/google-gemini-ai-update-december-2024/)                     │
│ 6. [Gemini 2.5: Pushing the Frontier with Advanced Reasoning                                                    │
│ ...](https://storage.googleapis.com/deepmind-media/gemini/gemini_v2_5_report.pdf)                               │
│ 7. [Comparing Google Gemini and ChatGPT: API Keys, Costs &                                                      │
│ Access](https://newo.ai/insights/google-gemini-vs-chatgpt-a-comprehensive-api-comparison/)                      │
│ 8. [ChatGPT vs Claude vs Gemini: Full Report and Comparison of                                                  │
│ ...](https://www.datastudios.org/post/chatgpt-vs-claude-vs-gemini-full-report-and-comparison-of-features-perfor │
│ mance-integrations-pric)                                                                                        │
│ 9. [ChatGPT vs Claude vs Gemini: The Best AI Model for Each Use                                                 │
│ ...](https://creatoreconomy.so/p/chatgpt-vs-claude-vs-gemini-the-best-ai-model-for-each-use-case-2025)          │
│ 10. [Rate limits | Gemini API | Google AI for Developers](https://ai.google.dev/gemini-api/docs/rate-limits)    │
│ 11. [Gemini Developer API Pricing | Gemini API | Google AI for                                                  │
│ Developers](https://ai.google.dev/gemini-api/docs/pricing)                                                      │
│ 12. [Vertex AI Pricing | Generative AI on Vertex AI - Google                                                    │
│ Cloud](https://cloud.google.com/vertex-ai/generative-ai/pricing)                                                │
│ 13. [Introducing deep research - OpenAI](https://openai.com/index/introducing-deep-research/)                   │
│ 14. [Introducing ChatGPT agent: bridging research and action -                                                  │
│ OpenAI](https://openai.com/index/introducing-chatgpt-agent/)                                                    │
│ 15. [OpenAI's Deep Research Tool: A Comprehensive                                                               │
│ Overview](https://bytebridge.medium.com/openais-deep-research-tool-a-comprehensive-overview-12ddab43feff)       │
│ 16. [Deep research - OpenAI API](https://platform.openai.com/docs/guides/deep-research)                         │
│ 17. [Introduction to deep research in the OpenAI                                                                │
│ API](https://cookbook.openai.com/examples/deep_research_api/introduction_to_deep_research_api)                  │
│ 18. [OpenAI Deep Research vs. Google Deep Research - AI                                                         │
│ Supremacy](https://www.ai-supremacy.com/p/openai-deep-research-vs-google-deep)                                  │
│ 19. [OpenAI Deep Research: How it Compares to Perplexity and                                                    │
│ Gemini](https://www.helicone.ai/blog/openai-deep-research)                                                      │
│ 20. [Can We Trust AI Benchmarks? An Interdisciplinary Review of ... -                                           │
│ arXiv](https://arxiv.org/html/2502.06559v2)

 """

In [73]:
import uuid
from typing import TypedDict, List
from langgraph.graph import StateGraph, START, END
from pydantic import BaseModel, Field
from langchain.chat_models import init_chat_model

# Chat model used by the structured-output wrapper further down in this cell.
# NOTE(review): the "google_genai:" prefix presumably selects the Google GenAI
# provider and requires its credentials in the environment — confirm.
model = init_chat_model("google_genai:models/gemini-flash-latest")

# --- 1. TypedDicts (The Internal Memory) ---
class Checkpoint(TypedDict):
    """One learning checkpoint in the shape stored under ``State.checkpoints``."""

    # String identifier; generate() fills this with str(uuid.uuid4()).
    id: str
    # Name of the checkpoint.
    name: str
    # Objective of the checkpoint; same field name as CheckpointItem.objective.
    objective: str

class State(TypedDict):
    """Schema handed to ``StateGraph``: the input report and the checkpoints derived from it."""

    # Report text supplied when the graph is invoked; generate() reads it.
    report: str
    # Checkpoint dicts written by generate() under the "checkpoints" key.
    checkpoints: list[Checkpoint]

# --- 2. Pydantic Models (The LLM Interface) ---
class CheckpointItem(BaseModel):
    # One checkpoint as requested from the LLM. It has no `id` field:
    # generate() adds the id after calling model_dump() on each item.
    # NOTE(review): documented with comments rather than a docstring because a
    # class docstring would presumably end up in the schema sent to the model — confirm.
    name: str = Field(description="The name of the checkpoint")
    objective: str = Field(description="the specific objective of the checkpoint")  # same field name as Checkpoint.objective

class CheckpointResponse(BaseModel):
    # Top-level structured-output schema: a list of CheckpointItem entries.
    # generate() iterates over this `checkpoints` attribute.
    checkpoints: List[CheckpointItem]

# Bind the CheckpointResponse schema to the model; generate() calls invoke()
# on this wrapper and reads `.checkpoints` from the result.
model_with_structured_output = model.with_structured_output(CheckpointResponse)

# --- 3. The Node ---
def generate(state: State):
    """Graph node: ask the model to split the report into learning checkpoints.

    Args:
        state: Graph state; only ``state['report']`` is read.

    Returns:
        A dict with the single key ``"checkpoints"`` (the same name as the
        ``checkpoints`` field of ``State``). Its value is a list of plain
        dicts, one per item in the model's response, each being the item's
        ``model_dump()`` plus an ``"id"`` key holding a fresh uuid4 string.
    """
    prompt = f"extract and breakdown this report {state['report']} into learning checkpoints"
    extraction = model_with_structured_output.invoke(prompt)

    # The LLM schema has no id, so one is attached here after dumping each
    # item to a dict; "id" is appended after the dumped fields.
    return {
        "checkpoints": [
            {**entry.model_dump(), "id": str(uuid.uuid4())}
            for entry in extraction.checkpoints
        ]
    }

# --- 4. Build Graph ---
# One-node graph over State, wired as START -> "generate" -> END.
builder = StateGraph(State)
builder.add_node("generate", generate)  # register generate() under the node name "generate"
builder.add_edge(START, "generate")
builder.add_edge("generate", END)

# Compile the builder into the `graph` object invoked in the run step below.
graph = builder.compile()

# --- 5. Run ---
# `report_var` is not assigned anywhere in this cell, so it must already exist
# in the kernel before this cell runs. The commented-out line below is only a
# short stand-in value for a quick test.
# report_var = "This is a report about learning Python."
result = graph.invoke({"report": report_var})

print(result)

{'report': " \n\n Here is the final report: # Comprehensive Comparison: Google Gemini vs. OpenAI Deep Research Agents (2025)      │\n│                                                                                                                 │\n│ ## Introduction                                                                                                 │\n│                                                                                                                 │\n│ This report provides a detailed, balanced comparison of Google’s Gemini AI suite and OpenAI’s Deep Research     │\n│ agents. Both technologies represent state-of-the-art advancements in artificial intelligence but are designed   │\n│ with distinct architectures, capabilities, use cases, and integration models. This analysis examines key        │\n│ aspects such as core features, intended applications, underlying technologies, performance benchmarks,          │\n│ integration options, and notable strengths and

In [74]:
result

{'report': " \n\n Here is the final report: # Comprehensive Comparison: Google Gemini vs. OpenAI Deep Research Agents (2025)      │\n│                                                                                                                 │\n│ ## Introduction                                                                                                 │\n│                                                                                                                 │\n│ This report provides a detailed, balanced comparison of Google’s Gemini AI suite and OpenAI’s Deep Research     │\n│ agents. Both technologies represent state-of-the-art advancements in artificial intelligence but are designed   │\n│ with distinct architectures, capabilities, use cases, and integration models. This analysis examines key        │\n│ aspects such as core features, intended applications, underlying technologies, performance benchmarks,          │\n│ integration options, and notable strengths and