Add Tavily search and extract workflow nodes

bchapuis · claude · bchapuis · commit c145105848e8 · 2026-04-07T01:54:26.000+02:00
Integrate the Tavily API for web search and content extraction by adding two
new workflow nodes. Both nodes are registered only when the TAVILY_API_KEY
environment variable is set.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
diff --git a/apps/api/.dev.vars.example b/apps/api/.dev.vars.example
@@ -27,6 +27,9 @@ GOOGLE_API_KEY=CHANGE_ME
 # Replicate
 REPLICATE_API_TOKEN=CHANGE_ME
 
+# Tavily
+TAVILY_API_KEY=CHANGE_ME
+
 # Integration OAuth (workflow integrations)
 # Use separate OAuth apps from authentication for security isolation
 # Each integration requires different scopes and redirect URIs
diff --git a/apps/api/src/context.ts b/apps/api/src/context.ts
@@ -62,6 +62,7 @@ export interface Bindings {
   HUGGINGFACE_API_KEY?: string;
   REPLICATE_API_TOKEN?: string;
   GOOGLE_API_KEY?: string;
+  TAVILY_API_KEY?: string;
   R2_ACCESS_KEY_ID?: string;
   R2_SECRET_ACCESS_KEY?: string;
   R2_BUCKET_NAME?: string;
diff --git a/apps/api/src/runtime/cloudflare-node-registry.ts b/apps/api/src/runtime/cloudflare-node-registry.ts
@@ -407,6 +407,8 @@ import { SubmitCommentRedditNode } from "@dafthunk/runtime/nodes/reddit/submit-c
 import { VoteRedditNode } from "@dafthunk/runtime/nodes/reddit/vote-reddit-node";
 import { ReplicateModelNode } from "@dafthunk/runtime/nodes/replicate/replicate-model-node";
 import { ReceiveScheduledTriggerNode } from "@dafthunk/runtime/nodes/scheduled/receive-scheduled-trigger-node";
+import { ExtractTavilyNode } from "@dafthunk/runtime/nodes/tavily/extract-tavily-node";
+import { SearchTavilyNode } from "@dafthunk/runtime/nodes/tavily/search-tavily-node";
 import { BotForwardMessageTelegramNode } from "@dafthunk/runtime/nodes/telegram/bot-forward-message-telegram-node";
 import { BotGetChatTelegramNode } from "@dafthunk/runtime/nodes/telegram/bot-get-chat-telegram-node";
 import { BotReceiveTelegramMessageNode } from "@dafthunk/runtime/nodes/telegram/bot-receive-telegram-message-node";
@@ -736,6 +738,12 @@ export class CloudflareNodeRegistry extends BaseNodeRegistry<Bindings> {
     this.registerImplementation(SearchWikipediaNode);
     this.registerImplementation(SearchMediaWikiNode);
 
+    // Tavily nodes
+    if (this.env.TAVILY_API_KEY) {
+      this.registerImplementation(SearchTavilyNode);
+      this.registerImplementation(ExtractTavilyNode);
+    }
+
     // Google API nodes
     if (this.env.GOOGLE_API_KEY) {
       this.registerImplementation(AirQualityGoogleNode);
diff --git a/packages/runtime/src/node-types.ts b/packages/runtime/src/node-types.ts
@@ -217,6 +217,7 @@ export interface NodeEnv {
   HUGGINGFACE_API_KEY?: string;
   REPLICATE_API_TOKEN?: string;
   GOOGLE_API_KEY?: string;
+  TAVILY_API_KEY?: string;
 }
 
 export interface NodeContext {
diff --git a/packages/runtime/src/nodes/tavily/extract-tavily-node.test.ts b/packages/runtime/src/nodes/tavily/extract-tavily-node.test.ts
@@ -0,0 +1,152 @@
+import type { NodeContext } from "@dafthunk/runtime";
+import type { Node } from "@dafthunk/types";
+import { beforeEach, describe, expect, it, vi } from "vitest";
+import { ExtractTavilyNode } from "./extract-tavily-node";
+
+global.fetch = vi.fn();
+
+describe("ExtractTavilyNode", () => {
+  // Shared fixtures used by most cases below.
+  const NODE_ID = "extract-tavily";
+  const EXAMPLE_URL = "https://example.com";
+  const VALID_ENV = { TAVILY_API_KEY: "tvly-test" };
+
+  // Typed view of the module-level `vi.fn()` that stands in for `fetch`.
+  const mockedFetch = () => global.fetch as ReturnType<typeof vi.fn>;
+
+  // Builds a context holding only the fields these tests supply, hence the cast.
+  function makeContext(
+    inputs: Record<string, unknown>,
+    env: Record<string, string> = {}
+  ): NodeContext {
+    const context = {
+      nodeId: NODE_ID,
+      inputs,
+      organizationId: "test-org",
+      env,
+    };
+    return context as unknown as NodeContext;
+  }
+
+  // Creates a fresh node and executes it against the given inputs and env.
+  function run(inputs: Record<string, unknown>, env?: Record<string, string>) {
+    const node = new ExtractTavilyNode({ nodeId: NODE_ID } as unknown as Node);
+    return node.execute(makeContext(inputs, env));
+  }
+
+  // Makes the mocked fetch resolve with an OK response whose JSON body is `payload`.
+  function stubFetchOk(payload: unknown): void {
+    mockedFetch().mockResolvedValue({
+      ok: true,
+      json: async () => payload,
+    });
+  }
+
+  beforeEach(() => {
+    vi.clearAllMocks();
+  });
+
+  it("should return error for missing urls", async () => {
+    const outcome = await run({}, VALID_ENV);
+
+    expect(outcome.status).toBe("error");
+    expect(outcome.error).toContain("Missing required input: urls");
+  });
+
+  it("should return error for invalid urls type", async () => {
+    const outcome = await run({ urls: 123 }, VALID_ENV);
+
+    expect(outcome.status).toBe("error");
+    expect(outcome.error).toContain("Invalid input type for urls");
+  });
+
+  it("should return error for missing API key", async () => {
+    const outcome = await run({ urls: [EXAMPLE_URL] });
+
+    expect(outcome.status).toBe("error");
+    expect(outcome.error).toContain("TAVILY_API_KEY");
+  });
+
+  it("should extract content from URLs", async () => {
+    stubFetchOk({
+      results: [
+        {
+          url: EXAMPLE_URL,
+          raw_content: "# Example\nPage content here.",
+        },
+      ],
+      failed_results: [],
+      response_time: 1.2,
+    });
+
+    const outcome = await run({ urls: [EXAMPLE_URL] }, VALID_ENV);
+
+    expect(outcome.status).toBe("completed");
+    expect(outcome.outputs?.results).toEqual([
+      {
+        url: EXAMPLE_URL,
+        content: "# Example\nPage content here.",
+      },
+    ]);
+    expect(outcome.outputs?.count).toBe(1);
+    expect(outcome.outputs?.failedResults).toEqual([]);
+  });
+
+  it("should accept a single URL string", async () => {
+    stubFetchOk({
+      results: [{ url: EXAMPLE_URL, raw_content: "Content" }],
+      failed_results: [],
+      response_time: 0.5,
+    });
+
+    await run({ urls: EXAMPLE_URL }, VALID_ENV);
+
+    // The second fetch argument is the request init; its body carries the URL list.
+    const [, requestInit] = mockedFetch().mock.calls[0];
+    const sentBody = JSON.parse(requestInit.body);
+    expect(sentBody.urls).toEqual([EXAMPLE_URL]);
+  });
+
+  it("should report failed extractions", async () => {
+    const blockedUrl = "https://blocked.com";
+    stubFetchOk({
+      results: [],
+      failed_results: [
+        {
+          url: blockedUrl,
+          error: "Access denied",
+        },
+      ],
+      response_time: 0.8,
+    });
+
+    const outcome = await run({ urls: [blockedUrl] }, VALID_ENV);
+
+    expect(outcome.status).toBe("completed");
+    expect(outcome.outputs?.results).toEqual([]);
+    expect(outcome.outputs?.failedResults).toEqual([
+      { url: blockedUrl, error: "Access denied" },
+    ]);
+    expect(outcome.outputs?.count).toBe(0);
+  });
+
+  it("should handle API errors", async () => {
+    mockedFetch().mockResolvedValue({
+      ok: false,
+      status: 401,
+    });
+
+    const outcome = await run(
+      { urls: [EXAMPLE_URL] },
+      { TAVILY_API_KEY: "tvly-bad-key" }
+    );
+
+    expect(outcome.status).toBe("error");
+    expect(outcome.error).toContain("401");
+  });
+});
diff --git a/packages/runtime/src/nodes/tavily/extract-tavily-node.ts b/packages/runtime/src/nodes/tavily/extract-tavily-node.ts
@@ -0,0 +1,155 @@
+import { ExecutableNode, type NodeContext } from "@dafthunk/runtime";
+import type { NodeExecution, NodeType } from "@dafthunk/types";
+
+/** A page Tavily extracted successfully; the node exposes `raw_content` as `content`. */
+interface TavilyExtractResult {
+  url: string;
+  raw_content: string;
+}
+
+/** A URL Tavily could not extract, together with the error it reported. */
+interface TavilyExtractFailedResult {
+  url: string;
+  error: string;
+}
+
+/**
+ * JSON body read from `POST https://api.tavily.com/extract`.
+ *
+ * The body is cast rather than validated, so both arrays are declared optional
+ * and a missing array is treated as empty by the node.
+ */
+interface TavilyExtractResponse {
+  results?: TavilyExtractResult[];
+  failed_results?: TavilyExtractFailedResult[];
+  response_time: number;
+}
+
+/** Returns true for a string containing at least one non-whitespace character. */
+function isNonBlankString(value: unknown): value is string {
+  return typeof value === "string" && value.trim() !== "";
+}
+
+/**
+ * Normalizes the `urls` input into a list of URL strings.
+ *
+ * @param urls - A single URL string or an array of URL strings.
+ * @returns The URL list, or `null` when the input is not a non-blank string or
+ *   a non-empty array made up solely of non-blank strings.
+ */
+function toUrlList(urls: unknown): string[] | null {
+  const candidates: unknown = typeof urls === "string" ? [urls] : urls;
+  if (!Array.isArray(candidates) || candidates.length === 0) {
+    return null;
+  }
+  return candidates.every(isNonBlankString) ? candidates : null;
+}
+
+/**
+ * Describes a rejected `urls` input for the validation error message.
+ * Only meaningful for values that `toUrlList` has already rejected.
+ */
+function describeInvalidUrls(urls: unknown): string {
+  if (typeof urls === "string") {
+    return "empty string";
+  }
+  if (Array.isArray(urls)) {
+    return urls.length === 0
+      ? "empty array"
+      : "array containing non-string or empty entries";
+  }
+  return typeof urls;
+}
+
+/**
+ * Workflow node that extracts page content for one or more URLs through the
+ * Tavily Extract endpoint.
+ *
+ * Outputs `results` (objects with `url` and `content`), `failedResults`
+ * (objects with `url` and `error`) and `count` (the number of entries in
+ * `results`).
+ */
+export class ExtractTavilyNode extends ExecutableNode {
+  public static readonly nodeType: NodeType = {
+    id: "extract-tavily",
+    name: "Extract (Tavily)",
+    type: "extract-tavily",
+    description: "Extract content from web pages using Tavily",
+    tags: ["Extract", "Web", "Tavily"],
+    icon: "file-text",
+    documentation:
+      "Extract clean, structured content from one or more web pages using the Tavily Extract API. Returns the page content in markdown or text format.",
+    usage: 10,
+    subscription: true,
+    asTool: true,
+    inputs: [
+      {
+        name: "urls",
+        type: "json",
+        description: "URL string or array of URLs to extract content from",
+        required: true,
+      },
+      {
+        name: "extractDepth",
+        type: "string",
+        description:
+          "Extraction depth: basic (1 credit per 5) or advanced (2 credits per 5). Defaults to basic.",
+        required: false,
+        hidden: true,
+      },
+      {
+        name: "format",
+        type: "string",
+        description: "Output format: markdown or text. Defaults to markdown.",
+        required: false,
+        hidden: true,
+      },
+      {
+        name: "includeImages",
+        type: "boolean",
+        description: "Include extracted image URLs. Defaults to false.",
+        required: false,
+        hidden: true,
+      },
+    ],
+    outputs: [
+      {
+        name: "results",
+        type: "json",
+        description: "Array of extracted content objects with url and content",
+      },
+      {
+        name: "failedResults",
+        type: "json",
+        description: "Array of URLs that failed to extract with error messages",
+        hidden: true,
+      },
+      {
+        name: "count",
+        type: "number",
+        description: "Number of successfully extracted pages",
+        hidden: true,
+      },
+    ],
+  };
+
+  /**
+   * Validates the inputs, calls the Tavily Extract endpoint and maps the response.
+   *
+   * Checks run in this order: `urls` present, `urls` well-formed, then
+   * `TAVILY_API_KEY` configured. Every failure, including a non-OK HTTP status
+   * or a thrown exception, is returned through `createErrorResult`.
+   *
+   * @param context - Supplies `inputs` (urls, extractDepth, format,
+   *   includeImages) and `env.TAVILY_API_KEY`.
+   * @returns A success result carrying `results`, `failedResults` and `count`,
+   *   or an error result describing what went wrong.
+   */
+  async execute(context: NodeContext): Promise<NodeExecution> {
+    try {
+      const { urls, extractDepth, format, includeImages } = context.inputs;
+
+      if (urls === null || urls === undefined) {
+        return this.createErrorResult("Missing required input: urls");
+      }
+
+      // Reject malformed lists locally instead of forwarding them to the API.
+      const urlList = toUrlList(urls);
+      if (urlList === null) {
+        return this.createErrorResult(
+          `Invalid input type for urls: expected string or non-empty array of strings, got ${describeInvalidUrls(urls)}`
+        );
+      }
+
+      const { TAVILY_API_KEY } = context.env;
+      if (!TAVILY_API_KEY) {
+        return this.createErrorResult(
+          "TAVILY_API_KEY environment variable is not configured"
+        );
+      }
+
+      // Optional fields are sent only when provided, so API-side defaults apply otherwise.
+      const body: Record<string, unknown> = { urls: urlList };
+
+      if (extractDepth && typeof extractDepth === "string") {
+        body.extract_depth = extractDepth;
+      }
+      if (format && typeof format === "string") {
+        body.format = format;
+      }
+      if (includeImages) {
+        body.include_images = true;
+      }
+
+      const response = await fetch("https://api.tavily.com/extract", {
+        method: "POST",
+        headers: {
+          Authorization: `Bearer ${TAVILY_API_KEY}`,
+          "Content-Type": "application/json",
+        },
+        body: JSON.stringify(body),
+      });
+
+      if (!response.ok) {
+        return this.createErrorResult(
+          `Tavily API request failed with status ${response.status}`
+        );
+      }
+
+      const data = (await response.json()) as TavilyExtractResponse;
+
+      // The body is unvalidated: treat a missing array as "no entries".
+      const results = (data.results ?? []).map((item) => ({
+        url: item.url,
+        content: item.raw_content,
+      }));
+
+      const failedResults = (data.failed_results ?? []).map((item) => ({
+        url: item.url,
+        error: item.error,
+      }));
+
+      return this.createSuccessResult({
+        results,
+        failedResults,
+        count: results.length,
+      });
+    } catch (err) {
+      // Thrown values are not guaranteed to be Error instances.
+      const message = err instanceof Error ? err.message : String(err);
+      return this.createErrorResult(`Error in ExtractTavily: ${message}`);
+    }
+  }
+}
diff --git a/packages/runtime/src/nodes/tavily/search-tavily-node.test.ts b/packages/runtime/src/nodes/tavily/search-tavily-node.test.ts
diff --git a/packages/runtime/src/nodes/tavily/search-tavily-node.ts b/packages/runtime/src/nodes/tavily/search-tavily-node.ts

Original file line number	Diff line number	Diff line change
`@@ -217,6 +217,7 @@ export interface NodeEnv {`
`217`	`217`	`HUGGINGFACE_API_KEY?: string;`
`218`	`218`	`REPLICATE_API_TOKEN?: string;`
`219`	`219`	`GOOGLE_API_KEY?: string;`
	`220`	`+ TAVILY_API_KEY?: string;`
`220`	`221`	`}`
`221`	`222`
`222`	`223`	`export interface NodeContext {`