langchain-ai · jacoblee93 · Nov 9, 2023 · Nov 9, 2023 · Nov 9, 2023 · Nov 9, 2023
diff --git a/docs/docs/modules/agents/agent_types/openai_functions_agent.mdx b/docs/docs/modules/agents/agent_types/openai_functions_agent.mdx
@@ -5,7 +5,7 @@ sidebar_position: 0
 
 # OpenAI functions
 
-Certain OpenAI models (like `gpt-3.5-turbo` and `gpt-4`) have been fine-tuned to detect when a function should to be called and respond with the inputs that should be passed to the function.
+Certain OpenAI models (like `gpt-3.5-turbo` and `gpt-4`) have been fine-tuned to detect when a function should be called and respond with the inputs that should be passed to the function.
 In an API call, you can describe functions and have the model intelligently choose to output a JSON object containing arguments to call those functions.
 The goal of the OpenAI Function APIs is to more reliably return valid and useful function calls than a generic text completion or chat API.
 
@@ -22,7 +22,7 @@ Must be used with an [OpenAI Functions](https://platform.openai.com/docs/guides/
 
 # With LCEL
 
-In this example we'll use LCEL to construct a highly customizable agent that is given two tools: search and calculator.
+In this example we'll use LCEL to construct a customizable agent that is given two tools: search and calculator.
 We'll then pull in a prompt template from the [LangChainHub](https://smith.langchain.com/hub) and pass that to our runnable agent.
 Lastly we'll use the default OpenAI functions output parser `OpenAIFunctionsAgentOutputParser`.
 This output parser contains a method `parseAIMessage` which, when provided with a message, returns either an instance of `FunctionsAgentAction` if there is another action to be taken by the agent, or `AgentFinish` if the agent has completed its objective.

diff --git a/docs/docs/modules/agents/agent_types/openai_tools_agent.mdx b/docs/docs/modules/agents/agent_types/openai_tools_agent.mdx
@@ -0,0 +1,131 @@
+---
+hide_table_of_contents: true
+sidebar_position: 1
+---
+
+# OpenAI tool calling
+
+:::tip Compatibility
+Tool calling is new and only available on [OpenAI's latest models](https://platform.openai.com/docs/guides/function-calling).
+:::
+
+OpenAI's latest `gpt-3.5-turbo-1106` and `gpt-4-1106-preview` models have been fine-tuned to detect when one or more tools should be called to gather sufficient information
+to answer the initial query, and respond with the inputs that should be passed to those tools.
+
+While the goal of more reliably returning valid and useful function calls is the same as that of the functions agent, the ability to return multiple tool calls at once results in
+fewer roundtrips for complex questions.
+
+The OpenAI Tools Agent is designed to work with these models.
+
+import CodeBlock from "@theme/CodeBlock";
+import RunnableExample from "@examples/agents/openai_tools_runnable.ts";
+
+# Usage
+
+In this example we'll use LCEL to construct a customizable agent with a mocked weather tool and a calculator.
+
+The basic flow is this:
+
+1. Define the tools the agent will be able to call. You can use [OpenAI's tool syntax](https://platform.openai.com/docs/guides/function-calling), or LangChain tool instances as shown below.
+2. Initialize our model and bind those tools as arguments.
+3. Define a function that formats any previous agent steps as messages. The agent will pass those back to OpenAI for the next agent iteration.
+4. Create a `RunnableSequence` that will act as the agent. We use a specialized output parser to extract any tool calls from the model's output.
+5. Initialize an `AgentExecutor` with the agent and the tools to execute the agent on a loop.
+6. Run the `AgentExecutor` and see the output.
+
+Here's how it looks:
+
+<CodeBlock language="typescript">{RunnableExample}</CodeBlock>
+
+You can check out this example trace for an inspectable view of the steps taken to answer the question: https://smith.langchain.com/public/2bbffb7d-4f9d-47ad-90be-09910e5b4b34/r
+
+## Adding memory
+
+We can also use memory to save our previous agent inputs and outputs, and pass them through to each agent iteration.
+Using memory can help give the agent better context on past interactions, which can lead to more accurate responses beyond what the `agent_scratchpad` can do.
+
+Adding memory only requires a few changes to the above example.
+
+First, import and instantiate your memory class. In this example we'll use `BufferMemory`.
+
+```typescript
+import { BufferMemory } from "langchain/memory";
+```
+
+```typescript
+const memory = new BufferMemory({
+  memoryKey: "history", // The object key to store the memory under
+  inputKey: "question", // The object key for the input
+  outputKey: "answer", // The object key for the output
+  returnMessages: true,
+});
+```
+
+Then, update your prompt to include another `MessagesPlaceholder`. This time we'll be passing in the `chat_history` variable from memory.
+
+```typescript
+const prompt = ChatPromptTemplate.fromMessages([
+  ["ai", "You are a helpful assistant"],
+  ["human", "{input}"],
+  new MessagesPlaceholder("agent_scratchpad"),
+  new MessagesPlaceholder("chat_history"),
+]);
+```
+
+Next, inside your `RunnableSequence` add a field for loading the `chat_history` from memory.
+
+```typescript
+const runnableAgent = RunnableSequence.from([
+  {
+    input: (i: { input: string; steps: ToolsAgentStep[] }) => i.input,
+    agent_scratchpad: (i: { input: string; steps: ToolsAgentStep[] }) =>
+      formatAgentSteps(i.steps),
+    // Load memory here
+    chat_history: async (_: { input: string; steps: ToolsAgentStep[] }) => {
+      const { history } = await memory.loadMemoryVariables({});
+      return history;
+    },
+  },
+  prompt,
+  modelWithTools,
+  new OpenAIToolsAgentOutputParser(),
+]);
+```
+
+Finally we can call the agent, and save the output after the response is returned.
+
+```typescript
+const query = "What is the weather in New York?";
+console.log(`Calling agent executor with query: ${query}`);
+const result = await executor.call({
+  input: query,
+});
+console.log(result);
+/*
+Calling agent executor with query: What is the weather in New York?
+{
+  output: 'The current weather in New York is sunny with a temperature of 66 degrees Fahrenheit. The humidity is at 54% and the wind is blowing at 6 mph. There is 0% chance of precipitation.'
+}
+*/
+
+// Save the result and initial input to memory
+await memory.saveContext(
+  {
+    question: query,
+  },
+  {
+    answer: result.output,
+  }
+);
+
+const query2 = "Do I need a jacket?";
+const result2 = await executor.call({
+  input: query2,
+});
+console.log(result2);
+/*
+{
+  output: 'Based on the current weather in New York, you may not need a jacket. However, if you feel cold easily or will be outside for a long time, you might want to bring a light jacket just in case.'
+}
+ */
+```
diff --git a/examples/src/agents/openai_runnable.ts b/examples/src/agents/openai_runnable.ts
@@ -36,7 +36,7 @@ const prompt = ChatPromptTemplate.fromMessages([
  * Here we're using the `formatToOpenAIFunction` util function
  * to format our tools into the proper schema for OpenAI functions.
  */
-const modelWithTools = model.bind({
+const modelWithFunctions = model.bind({
   functions: [...tools.map((tool) => formatToOpenAIFunction(tool))],
 });
 /**
@@ -68,7 +68,7 @@ const runnableAgent = RunnableSequence.from([
       formatAgentSteps(i.steps),
   },
   prompt,
-  modelWithTools,
+  modelWithFunctions,
   new OpenAIFunctionsAgentOutputParser(),
 ]);
 /** Pass the runnable along with the tools to create the Agent Executor */

diff --git a/examples/src/agents/openai_tools_runnable.ts b/examples/src/agents/openai_tools_runnable.ts
@@ -0,0 +1,87 @@
+import { z } from "zod";
+import { ChatOpenAI } from "langchain/chat_models/openai";
+import { DynamicStructuredTool } from "langchain/tools";
+import { Calculator } from "langchain/tools/calculator";
+import { BaseMessage, ToolMessage, AIMessage } from "langchain/schema";
+import { ChatPromptTemplate, MessagesPlaceholder } from "langchain/prompts";
+import { RunnableSequence } from "langchain/schema/runnable";
+import { AgentExecutor } from "langchain/agents";
+import {
+  OpenAIToolsAgentOutputParser,
+  type ToolsAgentStep,
+} from "langchain/agents/openai/output_parser";
+
+const model = new ChatOpenAI({
+  modelName: "gpt-3.5-turbo-1106",
+  temperature: 0,
+});
+
+const weatherTool = new DynamicStructuredTool({
+  name: "get_current_weather",
+  description: "Get the current weather in a given location",
+  func: async ({ location }) => {
+    if (location.toLowerCase().includes("tokyo")) {
+      return JSON.stringify({ location, temperature: "10", unit: "celsius" });
+    } else if (location.toLowerCase().includes("san francisco")) {
+      return JSON.stringify({
+        location,
+        temperature: "72",
+        unit: "fahrenheit",
+      });
+    } else {
+      return JSON.stringify({ location, temperature: "22", unit: "celsius" });
+    }
+  },
+  schema: z.object({
+    location: z.string().describe("The city and state, e.g. San Francisco, CA"),
+    unit: z.enum(["celsius", "fahrenheit"]),
+  }),
+});
+
+const tools = [new Calculator(), weatherTool];
+
+const modelWithTools = model.bind({ tools });
+
+const formatAgentSteps = (steps: ToolsAgentStep[]): BaseMessage[] =>
+  steps.flatMap(({ action, observation }) => {
+    if ("messageLog" in action && action.messageLog !== undefined) {
+      const log = action.messageLog as BaseMessage[];
+      return log.concat(
+        new ToolMessage({
+          content: observation,
+          tool_call_id: action.toolCallId,
+        })
+      );
+    } else {
+      return [new AIMessage(action.log)];
+    }
+  });
+
+const prompt = ChatPromptTemplate.fromMessages([
+  ["ai", "You are a helpful assistant"],
+  ["human", "{input}"],
+  new MessagesPlaceholder("agent_scratchpad"),
+]);
+
+const runnableAgent = RunnableSequence.from([
+  {
+    input: (i: { input: string; steps: ToolsAgentStep[] }) => i.input,
+    agent_scratchpad: (i: { input: string; steps: ToolsAgentStep[] }) =>
+      formatAgentSteps(i.steps),
+  },
+  prompt,
+  modelWithTools,
+  new OpenAIToolsAgentOutputParser(),
+]).withConfig({ runName: "OpenAIToolsAgent" });
+
+const executor = AgentExecutor.fromAgentAndTools({
+  agent: runnableAgent,
+  tools,
+});
+
+const res = await executor.invoke({
+  input:
+    "What is the sum of the current temperature in San Francisco, New York, and Tokyo?",
+});
+
+console.log(res);
diff --git a/langchain/package.json b/langchain/package.json
@@ -1364,7 +1364,7 @@
     "langchainhub": "~0.0.6",
     "langsmith": "~0.0.48",
     "ml-distance": "^4.0.0",
-    "openai": "^4.16.1",
+    "openai": "^4.17.0",
     "openapi-types": "^12.1.3",
     "p-queue": "^6.6.2",
     "p-retry": "4",

diff --git a/langchain/src/agents/openai/output_parser.ts b/langchain/src/agents/openai/output_parser.ts
@@ -2,11 +2,15 @@ import type { OpenAI as OpenAIClient } from "openai";
 import {
   AgentAction,
   AgentFinish,
+  AgentStep,
   BaseMessage,
   ChatGeneration,
   isBaseMessage,
 } from "../../schema/index.js";
-import { AgentActionOutputParser } from "../types.js";
+import {
+  AgentActionOutputParser,
+  AgentMultiActionOutputParser,
+} from "../types.js";
 import { OutputParserException } from "../../schema/output_parser.js";
 
 /**
@@ -83,3 +87,88 @@ export class OpenAIFunctionsAgentOutputParser extends AgentActionOutputParser {
     );
   }
 }
+
+/**
+ * Type that represents an agent action for a single tool call: the ID of the call plus an optional message log.
+ */
+export type ToolsAgentAction = AgentAction & {
+  toolCallId: string;
+  messageLog?: BaseMessage[];
+};
+
+export type ToolsAgentStep = AgentStep & {
+  action: ToolsAgentAction;
+};
+
+export class OpenAIToolsAgentOutputParser extends AgentMultiActionOutputParser {
+  lc_namespace = ["langchain", "agents", "openai"];
+
+  static lc_name() {
+    return "OpenAIToolsAgentOutputParser";
+  }
+
+  async parse(text: string): Promise<AgentAction[] | AgentFinish> {
+    throw new Error(
+      `OpenAIToolsAgentOutputParser can only parse messages.\nPassed input: ${text}`
+    );
+  }
+
+  async parseResult(generations: ChatGeneration[]) {
+    if ("message" in generations[0] && isBaseMessage(generations[0].message)) {
+      return this.parseAIMessage(generations[0].message);
+    }
+    throw new Error(
+      "parseResult on OpenAIToolsAgentOutputParser only works on ChatGeneration output"
+    );
+  }
+
+  /**
+   * Parses the output message into a ToolsAgentAction[] or AgentFinish
+   * object.
+   * @param message The BaseMessage to parse.
+   * @returns A ToolsAgentAction[] or AgentFinish object.
+   */
+  parseAIMessage(message: BaseMessage): ToolsAgentAction[] | AgentFinish {
+    if (message.content && typeof message.content !== "string") {
+      throw new Error("This agent cannot parse non-string model responses.");
+    }
+    if (message.additional_kwargs.tool_calls) {
+      const toolCalls: OpenAIClient.Chat.ChatCompletionMessageToolCall[] =
+        message.additional_kwargs.tool_calls;
+      try {
+        return toolCalls.map((toolCall, i) => {
+          const toolInput = toolCall.function.arguments
+            ? JSON.parse(toolCall.function.arguments)
+            : {};
+          const messageLog = i === 0 ? [message] : [];
+          return {
+            tool: toolCall.function.name as string,
+            toolInput,
+            toolCallId: toolCall.id,
+            log: `Invoking "${toolCall.function.name}" with ${
+              toolCall.function.arguments ?? "{}"
+            }\n${message.content}`,
+            messageLog,
+          };
+        });
+      } catch (error) {
+        throw new OutputParserException(
+          `Failed to parse tool arguments from chat model response. Text: "${JSON.stringify(
+            toolCalls
+          )}". ${error}`
+        );
+      }
+    } else {
+      return {
+        returnValues: { output: message.content },
+        log: message.content,
+      };
+    }
+  }
+
+  getFormatInstructions(): string {
+    throw new Error(
+      "getFormatInstructions not implemented inside OpenAIToolsAgentOutputParser."
+    );
+  }
+}