fix: stream utils for deep search

2026-01-10 23:48:26 +00:00 · 2025-10-15 23:18:59 +05:30 · 2025-10-15 23:18:59 +05:30 · 949b534383
commit 949b534383
parent 45a7364e57
2 changed files with 98 additions and 20 deletions
--- a/apps/webapp/app/trigger/deep-search/deep-search-utils.ts
+++ b/apps/webapp/app/trigger/deep-search/deep-search-utils.ts
@ -1,6 +1,7 @@
 import { type CoreMessage } from "ai";
 import { logger } from "@trigger.dev/sdk/v3";
-import { generate, processTag } from "../chat/stream-utils";
+import { generate } from "./stream-utils";
+import { processTag } from "../chat/stream-utils";
 import { type AgentMessage, AgentMessageType, Message } from "../chat/types";
 import { TotalCost } from "../utils/types";

@ -36,7 +37,7 @@ export async function* run(
      logger.info(`ReAct loop iteration ${guardLoop}, searches: ${searchCount}`);

      // Call LLM with current message history
-      const response = generate(messages, false, (event)=>{const usage = event.usage;
+      const response = generate(messages, (event)=>{const usage = event.usage;
        totalCost.inputTokens += usage.promptTokens;
        totalCost.outputTokens += usage.completionTokens;
      }, tools);
@ -95,34 +96,31 @@ export async function* run(
        }
      }

-      // Execute tool calls sequentially
+      // Execute tool calls in parallel for better performance
      if (toolCalls.length > 0) {
+        // Notify about all searches starting
        for (const toolCall of toolCalls) {
-          // Add assistant message with tool call
-          messages.push({
-            role: "assistant",
-            content: [
-              {
-                type: "tool-call",
-                toolCallId: toolCall.toolCallId,
-                toolName: toolCall.toolName,
-                args: toolCall.args,
-              },
-            ],
-          });
-
-          // Execute the search tool
          logger.info(`Executing search: ${JSON.stringify(toolCall.args)}`);
-
-          // Notify about search starting
          yield Message("", AgentMessageType.SKILL_START);
          yield Message(
            `\nSearching memory: "${toolCall.args.query}"...\n`,
            AgentMessageType.SKILL_CHUNK
          );
          yield Message("", AgentMessageType.SKILL_END);
+        }

-          const result = await searchTool.execute(toolCall.args);
+        // Execute all searches in parallel
+        const searchPromises = toolCalls.map((toolCall) =>
+          searchTool.execute(toolCall.args).then((result: any) => ({
+            toolCall,
+            result,
+          }))
+        );
+
+        const searchResults = await Promise.all(searchPromises);
+
+        // Process results and add to message history
+        for (const { toolCall, result } of searchResults) {
          searchCount++;

          // Deduplicate episodes - track unique IDs
@ -141,6 +139,18 @@ export async function* run(
          const episodesInThisSearch = result.episodes?.length || 0;
          totalEpisodesFound = seenEpisodeIds.size; // Use unique count

+          messages.push({
+            role: "assistant",
+            content: [
+              {
+                type: "tool-call",
+                toolCallId: toolCall.toolCallId,
+                toolName: toolCall.toolName,
+                args: toolCall.args,
+              },
+            ],
+          });
+
          // Add tool result to message history
          messages.push({
            role: "tool",
--- a/apps/webapp/app/trigger/deep-search/stream-utils.ts
+++ b/apps/webapp/app/trigger/deep-search/stream-utils.ts
@ -0,0 +1,68 @@
+import { openai } from "@ai-sdk/openai";
+import { logger } from "@trigger.dev/sdk/v3";
+import {
+  type CoreMessage,
+  type LanguageModelV1,
+  streamText,
+  type ToolSet,
+} from "ai";
+
+/**
+ * Generate LLM responses with tool calling support
+ * Simplified version for deep-search use case - NO maxSteps for manual ReAct control
+ */
+export async function* generate(
+  messages: CoreMessage[],
+  onFinish?: (event: any) => void,
+  tools?: ToolSet,
+  model?: string,
+): AsyncGenerator<
+  | string
+  | {
+      type: string;
+      toolName: string;
+      args?: any;
+      toolCallId?: string;
+    }
+> {
+  const modelToUse = model || process.env.MODEL || "gpt-4.1-2025-04-14";
+  const modelInstance = openai(modelToUse) as LanguageModelV1;
+
+  logger.info(`Starting LLM generation with model: ${modelToUse}`);
+
+  try {
+    const { textStream, fullStream } = streamText({
+      model: modelInstance,
+      messages,
+      temperature: 1,
+      tools,
+      // NO maxSteps - we handle tool execution manually in the ReAct loop
+      toolCallStreaming: true,
+      onFinish,
+    });
+
+    // Yield text chunks
+    for await (const chunk of textStream) {
+      yield chunk;
+    }
+
+    // Yield tool calls
+    for await (const fullChunk of fullStream) {
+      if (fullChunk.type === "tool-call") {
+        yield {
+          type: "tool-call",
+          toolName: fullChunk.toolName,
+          toolCallId: fullChunk.toolCallId,
+          args: fullChunk.args,
+        };
+      }
+
+      if (fullChunk.type === "error") {
+        logger.error(`LLM error: ${JSON.stringify(fullChunk)}`);
+      }
+    }
+  } catch (error) {
+    logger.error(`LLM generation error: ${error}`);
+    throw error;
+  }
+}