run-llama
diff --git a/‎.changeset/five-peaches-brush.md‎
Lines changed: 5 additions & 0 deletions b/‎.changeset/five-peaches-brush.md‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎.changeset/red-bushes-brake.md‎
Lines changed: 5 additions & 0 deletions b/‎.changeset/red-bushes-brake.md‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎apps/next/src/content/docs/llamaindex/modules/agents/agent_workflow.mdx‎
Lines changed: 52 additions & 0 deletions b/‎apps/next/src/content/docs/llamaindex/modules/agents/agent_workflow.mdx‎
Lines changed: 52 additions & 0 deletions
diff --git a/‎apps/next/src/content/docs/llamaindex/modules/agents/low-level.mdx‎
Lines changed: 36 additions & 2 deletions b/‎apps/next/src/content/docs/llamaindex/modules/agents/low-level.mdx‎
Lines changed: 36 additions & 2 deletions
diff --git a/‎examples/agents/agent/structured-object.ts‎
Lines changed: 39 additions & 0 deletions b/‎examples/agents/agent/structured-object.ts‎
Lines changed: 39 additions & 0 deletions
diff --git a/‎examples/agents/tools/exec-object.ts‎
Lines changed: 48 additions & 0 deletions b/‎examples/agents/tools/exec-object.ts‎
Lines changed: 48 additions & 0 deletions
diff --git a/‎examples/agents/tools/response-format-exec.ts‎
Lines changed: 4 additions & 2 deletions b/‎examples/agents/tools/response-format-exec.ts‎
Lines changed: 4 additions & 2 deletions
@@ -0,0 +1,5 @@
+---
+"@llamaindex/core": patch
+---
+
+feat: return structured object from llm.exec
@@ -0,0 +1,5 @@
+---
+"@llamaindex/workflow": patch
+---
+
+feat: return structured data when using agent.run()
@@ -37,6 +37,58 @@ console.log(result.data.result); // Baby Llama is called cria
 console.log(result.data.message); // { role: 'assistant', content: 'Baby Llama is called cria' }
 ```
 
+### Structured Output
+
+You can extract structured data from agent responses by providing a `responseFormat` with a Zod schema. This is useful when you need the agent's response in a specific format for further processing:
+
+```typescript
+import { z } from "zod";
+import { tool } from "llamaindex";
+import { agent } from "@llamaindex/workflow";
+import { openai } from "@llamaindex/openai";
+
+// Define a weather tool
+const weatherTool = tool({
+  name: "weatherTool",
+  description: "Get weather information",
+  parameters: z.object({
+    location: z.string(),
+  }),
+  execute: ({ location }) => {
+    return `The weather in ${location} is sunny. The temperature is 72 degrees. The humidity is 50%. The wind speed is 10 mph.`;
+  },
+});
+
+// Define the structure you want for the response
+const responseSchema = z.object({
+  temperature: z.number(),
+  humidity: z.number(),
+  windSpeed: z.number(),
+});
+
+// Create the agent
+const weatherAgent = agent({
+  name: "weatherAgent",
+  tools: [weatherTool],
+  llm: openai({ model: "gpt-4.1-mini" }),
+});
+
+// Run with structured output
+const result = await weatherAgent.run("What's the weather in Tokyo?", {
+  responseFormat: responseSchema,
+});
+
+console.log("Natural language result:", result.data.result);
+console.log("Structured data:", result.data.object);
+// Output: { temperature: 72, humidity: 50, windSpeed: 10 }
+```
+
+The agent will:
+1. Use the weather tool to get the raw weather information
+2. Process that information through the LLM
+3. Extract structured data according to your schema
+4. Return both the natural language response and the structured object
+
 ### Event Streaming
 
 Agent Workflows provide a unified interface for event streaming, making it easy to track and respond to different events during execution:
 
@@ -9,6 +9,7 @@ Sometimes you need more control over LLM interactions than what high-level agen
 Use `llm.exec` when you need to:
 - Build custom agent logic in [workflow](/docs/llamaindex/modules/agents/workflows) steps
 - Have precise control over message handling and tool execution
+- Extract structured data from LLM responses
 
 ## Basic Usage
 
@@ -51,6 +52,38 @@ messages.push(...newMessages);
 
 > `newMessages` is an array as each tool call generates two messages: a tool call message and the tool call result message.
 
+## Structured Output
+
+You can use `responseFormat` with a Zod schema to get structured data from the LLM response:
+
+```ts
+import { openai } from "@llamaindex/openai";
+import { ChatMessage } from "llamaindex";
+import z from "zod";
+
+const llm = openai({ model: "gpt-4.1-mini" });
+
+const schema = z.object({
+  title: z.string(),
+  author: z.string(),
+  year: z.number(),
+});
+
+const messages = [
+  {
+    role: "user",
+    content: "I have been reading La Divina Commedia by Dante Alighieri, published in 1321",
+  } as ChatMessage,
+];
+
+const { newMessages, toolCalls, object } = await llm.exec({
+  messages,
+  responseFormat: schema,
+});
+
+console.log(object); // { title: "La Divina Commedia", author: "Dante Alighieri", year: 1321 }
+```
+
 ## Agent Loop Pattern
 
 A common pattern is to use `llm.exec` in a loop until the LLM stops making tool calls:
@@ -102,7 +135,7 @@ For real-time responses, use the `stream` option to get the assistant's response
 
 ```ts
 import { openai } from "@llamaindex/openai";
-import { tool } from "llamaindex";
+import { ChatMessage, tool } from "llamaindex";
 import z from "zod";
 
 async function streamingAgentLoop() {
@@ -153,6 +186,7 @@ async function streamingAgentLoop() {
 
 - **`newMessages`**: Array of new chat messages including the LLM response and any tool call messages (call or result). When streaming, this is a function that returns the array.
 - **`toolCalls`**: Array of tool calls made by the LLM
+- **`object`**: The structured object when using `responseFormat` with a Zod schema (`undefined` if no schema is provided)
 - **`stream`**: Async iterable for streaming responses (only when `stream: true`)
 
 ## Best Practices
@@ -161,4 +195,4 @@ For using `llm.exec` in an agent loop, take care to:
 
 1. **Maintain message history**: Always add `newMessages` to your conversation history
 2. **Set exit conditions**: Implement proper logic to avoid infinite loops
-
+3. **Handle structured output**: When using `responseFormat`, the `object` property contains your parsed data
@@ -0,0 +1,39 @@
+import { z } from "zod";
+
+import { openai } from "@llamaindex/openai";
+import { agent } from "@llamaindex/workflow";
+import { tool } from "llamaindex";
+
+const weatherTool = tool({
+  name: "weatherTool",
+  description: "Get weather information",
+  parameters: z.object({
+    location: z.string(),
+  }),
+  execute: ({ location }) => {
+    return `The weather in ${location} is sunny. The temperature is 72 degrees. The humidity is 50%. The wind speed is 10 mph.`;
+  },
+});
+
+const responseSchema = z.object({
+  temperature: z.number(),
+  humidity: z.number(),
+  windSpeed: z.number(),
+});
+
+const myAgent = agent({
+  name: "myAgent",
+  tools: [weatherTool],
+  llm: openai({ model: "gpt-4.1-mini" }),
+});
+
+async function main() {
+  const result = await myAgent.run("What's the weather in Tokyo?", {
+    responseFormat: responseSchema,
+  });
+
+  console.log("result.data.result: ", result.data.result);
+  console.log("result.data.object: ", result.data.object);
+}
+
+main().catch(console.error);
@@ -0,0 +1,48 @@
+import { openai } from "@llamaindex/openai";
+import { ChatMessage } from "llamaindex";
+import z from "zod";
+
+const llm = openai({ model: "gpt-4.1-mini" });
+
+const schema = z.object({
+  title: z.string(),
+  author: z.string(),
+  year: z.number(),
+});
+
+const messages: ChatMessage[] = [
+  {
+    role: "user",
+    content: `I have been reading La Divina Commedia by Dante Alighieri, published in 1321`,
+  },
+];
+
+async function main() {
+  {
+    // Non-streaming
+    const { object } = await llm.exec({ messages, responseFormat: schema });
+    console.log("Non-streaming object:", object);
+  }
+
+  {
+    // Streaming
+    let exit = false;
+    do {
+      const { stream, newMessages, toolCalls, object } = await llm.exec({
+        messages,
+        stream: true,
+        responseFormat: schema,
+      });
+
+      for await (const chunk of stream) {
+        console.log(chunk.delta);
+      }
+      console.log("Streaming object:", object);
+
+      messages.push(...newMessages());
+      exit = toolCalls.length === 0;
+    } while (!exit);
+  }
+}
+
+main().catch(console.error);
@@ -13,6 +13,7 @@ const responseSchema = z.object({
 async function main() {
   const messages: ChatMessage[] = [];
   let toolCalls: ToolCall[] = [];
+  let object: z.infer<typeof responseSchema> | undefined;
   do {
     const result = await llm.exec({
       messages: [
@@ -27,13 +28,14 @@ async function main() {
       ],
       responseFormat: responseSchema,
     });
-    console.log(result.newMessages[0].content);
+    object = result.object;
     messages.push(...result.newMessages);
     toolCalls = result.toolCalls;
   } while (toolCalls.length == 0);
 
-  console.log(messages[1].content);
+  console.log(messages);
   console.log(toolCalls);
+  console.log(object);
 }
 
 main().catch(console.error);
-Original file line number
+Diff line change
@@ @@ -0,0 +1,5 @@ @@
 +---
 +"@llamaindex/core": patch
 +---
++
 +feat: return structured object from llm.exec