traceloop
diff --git a/‎packages/ai-semantic-conventions/src/SemanticAttributes.ts‎
Lines changed: 15 additions & 0 deletions b/‎packages/ai-semantic-conventions/src/SemanticAttributes.ts‎
Lines changed: 15 additions & 0 deletions
diff --git a/‎packages/sample-app/src/guardrails/custom_evaluator.ts‎
Lines changed: 148 additions & 0 deletions b/‎packages/sample-app/src/guardrails/custom_evaluator.ts‎
Lines changed: 148 additions & 0 deletions
diff --git a/‎packages/sample-app/src/guardrails/error_handling.ts‎
Lines changed: 201 additions & 0 deletions b/‎packages/sample-app/src/guardrails/error_handling.ts‎
Lines changed: 201 additions & 0 deletions
@@ -16,6 +16,21 @@
 // TODO: Remove unnecessary comments after all instrumentations are updated before (parent branch merge)
 
 export const SpanAttributes = {
+  // Guardrail attributes (custom — not yet in OTel core spec)
+
+  // Parent guardrail span (gen_ai.operation.name = "guardrail.run")
+  GEN_AI_GUARDRAIL_NAME: "gen_ai.guardrail.name",
+  GEN_AI_GUARDRAIL_STATUS: "gen_ai.guardrail.status",
+  GEN_AI_GUARDRAIL_DURATION: "gen_ai.guardrail.duration",
+  GEN_AI_GUARDRAIL_GUARD_COUNT: "gen_ai.guardrail.guard_count",
+  GEN_AI_GUARDRAIL_FAILED_GUARD_COUNT: "gen_ai.guardrail.failed_guard_count",
+
+  // Child guard span (gen_ai.operation.name = "guard")
+  GEN_AI_GUARDRAIL_INPUT: "gen_ai.guardrail.input",
+  GEN_AI_GUARDRAIL_OUTPUT: "gen_ai.guardrail.output",
+  GEN_AI_GUARDRAIL_ERROR_TYPE: "gen_ai.guardrail.error.type",
+  GEN_AI_GUARDRAIL_ERROR_MESSAGE: "gen_ai.guardrail.error.message",
+
   // Attributes not yet in @opentelemetry/semantic-conventions
 
   // TODO: Remove after all instrumentations are updated
 
@@ -0,0 +1,148 @@
+/**
+ * Custom Evaluator Guard Example
+ * ================================
+ * Shows how to use a custom LLM-as-a-judge evaluator as a guard.
+ *
+ * Scenario: a physics education app that only answers physics questions.
+ * The LLM response is checked with the custom evaluator guard to confirm
+ * it actually contains physics content. Off-topic responses are blocked
+ * and replaced with a fallback message.
+ *
+ * The custom evaluator uses a two-call HTTP flow:
+ *   1. POST /v2/evaluators/{slug}/executions  — trigger the LLM judge
+ *   2. GET  /v2{streamUrl}                    — blocking long-poll for result
+ *
+ * Prerequisites:
+ *   - A custom evaluator with slug "custom-test" must exist on your backend.
+ *     The evaluator should return { isValid: boolean, reasoning: string }.
+ *     Its prompt template should use {llm_response} as the input variable.
+ *
+ * Run:
+ *   npm run build && node dist/src/guardrails/custom_evaluator.js
+ *
+ * Environment:
+ *   OPENAI_API_KEY     — OpenAI key
+ *   TRACELOOP_API_KEY  — your Traceloop API key
+ *   TRACELOOP_BASE_URL — https://api.traceloop.dev
+ */
+
+// ── Init — Traceloop FIRST ───────────────────────────────────────────────────
+import * as traceloop from "@traceloop/node-server-sdk";
+import OpenAI from "openai";
+
+// Configure the Traceloop SDK up front; the API key and base URL are read from
+// the environment variables listed in the file header.
+traceloop.initialize({
+  appName: "guardrails-custom-evaluator-example",
+  apiKey: process.env.TRACELOOP_API_KEY,
+  baseUrl: process.env.TRACELOOP_BASE_URL,
+  disableBatch: true,
+  silenceInitializationMessage: true,
+  instrumentModules: {
+    // Hand the imported OpenAI module to the SDK for instrumentation.
+    // NOTE(review): the `any` cast presumably bridges a typing mismatch between
+    // the two packages — confirm it is still required.
+    // eslint-disable-next-line @typescript-eslint/no-explicit-any
+    openAI: OpenAI as any,
+  },
+});
+
+import {
+  Guardrails,
+  customEvaluatorGuard,
+  isTrue,
+} from "@traceloop/node-server-sdk";
+
+// OpenAI client built with no explicit options.
+// NOTE(review): presumably picks up OPENAI_API_KEY from the environment (see header) — confirm.
+const openai = new OpenAI();
+
+// The slug of the custom evaluator on your Traceloop backend.
+// The evaluator should accept {llm_response} and return { isValid: boolean }.
+const EVALUATOR_SLUG = "custom-test";
+
+// Message shown to the user in place of an LLM response that the guard blocks.
+const FALLBACK =
+  "I can only help with physics questions. Please ask something related to physics.";
+
+// ── Helpers ───────────────────────────────────────────────────────────────────
+
+/**
+ * Sends one user question to the chat completions API under a fixed
+ * physics-tutor system prompt.
+ *
+ * @param question - Text forwarded verbatim as the user message.
+ * @returns The content of the first choice, or "" when it is missing.
+ */
+async function askLLM(question: string): Promise<string> {
+  const systemPrompt =
+    "You are a physics tutor. Answer questions about physics concisely.";
+
+  const completion = await openai.chat.completions.create({
+    model: "gpt-4o-mini",
+    max_tokens: 200,
+    messages: [
+      { role: "system", content: systemPrompt },
+      { role: "user", content: question },
+    ],
+  });
+
+  // Optional chaining covers an absent first choice as well as null content.
+  const firstChoice = completion.choices[0];
+  return firstChoice?.message?.content ?? "";
+}
+
+// ── Guard setup ───────────────────────────────────────────────────────────────
+
+// Custom evaluator guard — checks whether the LLM response is about physics.
+// conditionField "isValid" maps to the boolean field in the evaluator output.
+// The {llm_response} template variable is NOT supplied here; it is provided by
+// the inputMapper configured on the Guardrails instance that wraps this guard.
+const physicsContentGuard = customEvaluatorGuard(EVALUATOR_SLUG, {
+  conditionField: "isValid",
+  condition: isTrue(),
+  // 60 000 ms budget for the evaluator call.
+  timeoutMs: 60000,
+});
+
+// Guardrails instance that runs the single physics guard over an LLM response.
+const responseGuard = new Guardrails([physicsContentGuard], {
+  // Value handed back instead of the response when the guard blocks it.
+  onFailure: FALLBACK,
+  // The custom evaluator template uses {llm_response} — map the LLM output to that field.
+  inputMapper: (output) => [{ llm_response: output as string }],
+});
+
+// ── Main ──────────────────────────────────────────────────────────────────────
+
+/**
+ * Runs two scenarios inside one Traceloop workflow:
+ *   1. a physics question whose answer is expected to pass the guard, and
+ *   2. an off-topic question whose answer is expected to be replaced by FALLBACK.
+ *
+ * Telemetry is flushed in a `finally` block so it is not lost when a scenario
+ * throws (for example on an OpenAI or evaluator failure); the error itself
+ * still propagates to the caller.
+ */
+async function main(): Promise<void> {
+  // Show at most 100 characters and add the ellipsis only when text was cut,
+  // so short or empty responses are not displayed as if they were truncated.
+  const preview = (text: string): string =>
+    text.length > 100 ? `${text.slice(0, 100)}...` : text;
+
+  try {
+    await traceloop.withWorkflow(
+      { name: "custom-evaluator-example" },
+      async () => {
+        console.log(
+          "\n── guard() on response — physics question → LLM → evaluator ──",
+        );
+        // A real physics question: LLM answers, custom evaluator confirms it's physics.
+
+        const physicsQuestion =
+          "How does Newton's second law relate force and mass?";
+        console.log(`Question: "${physicsQuestion}"`);
+
+        const llmResponse = await askLLM(physicsQuestion);
+        console.log(`LLM response: "${preview(llmResponse)}"`);
+
+        // Time only the guard evaluation, not the LLM call above.
+        const start = Date.now();
+        const physicsResult = await responseGuard.run(async () => llmResponse);
+        const duration = Date.now() - start;
+
+        console.log(
+          `Custom evaluator result: ${physicsResult !== FALLBACK ? "✅ physics confirmed" : "🚫 not physics"} (${duration}ms)`,
+        );
+
+        console.log(
+          "\n── off-topic question → LLM → evaluator blocks response ──",
+        );
+        // An off-topic question: LLM answers about cooking, evaluator blocks it.
+
+        const offTopicQuestion = "What is the best way to cook pasta?";
+        console.log(`Question: "${offTopicQuestion}"`);
+
+        const offTopicResponse = await askLLM(offTopicQuestion);
+        console.log(`LLM response: "${preview(offTopicResponse)}"`);
+
+        // run() calls the guard and invokes onFailure (returns FALLBACK) if blocked
+        const finalResponse = await responseGuard.run(
+          async () => offTopicResponse,
+        );
+        console.log(`Response shown to user: "${finalResponse}"`);
+
+        console.log(
+          "\n── done ───────────────────────────────────────────────────",
+        );
+        console.log("Check the Traceloop UI for span details.\n");
+      },
+    );
+  } finally {
+    // Flush on both the success and the failure path.
+    await traceloop.forceFlush();
+  }
+}
+
+// Handle a rejected main() explicitly instead of leaving the promise floating:
+// log the error and mark the process as failed.
+main().catch((err: unknown) => {
+  console.error(err);
+  process.exitCode = 1;
+});
@@ -0,0 +1,201 @@
+/**
+ * Guard Error Handling Example
+ * =============================
+ * Demonstrates that real guard errors (network timeout, HTTP failure, code bug)
+ * propagate as GuardExecutionError — they are NOT silently treated as logical
+ * failures. This matches Python SDK behavior.
+ *
+ * Each example verifies:
+ *   - GuardExecutionError is thrown to the caller
+ *   - The guard span gets ERROR OTel status plus the gen_ai.guardrail.error.type
+ *     and gen_ai.guardrail.error.message attributes
+ *
+ * Check the Traceloop UI after running — look for spans with red ERROR status.
+ *
+ * Run:
+ *   npm run build && node dist/src/guardrails/error_handling.js
+ *
+ * Environment:
+ *   TRACELOOP_API_KEY  — your Traceloop API key
+ *   TRACELOOP_BASE_URL — https://api.traceloop.dev
+ */
+
+// ── Init — Traceloop FIRST ───────────────────────────────────────────────────
+import * as traceloop from "@traceloop/node-server-sdk";
+
+// Configure the Traceloop SDK up front; the API key and base URL are read from
+// the environment variables listed in the file header.
+traceloop.initialize({
+  appName: "guardrails-error-handling-example",
+  apiKey: process.env.TRACELOOP_API_KEY,
+  baseUrl: process.env.TRACELOOP_BASE_URL,
+  disableBatch: true,
+  silenceInitializationMessage: true,
+});
+
+import {
+  Guardrails,
+  validateContent,
+  GuardExecutionError,
+} from "@traceloop/node-server-sdk";
+import type { Guard } from "@traceloop/node-server-sdk";
+
+// ── Helpers ───────────────────────────────────────────────────────────────────
+
+/**
+ * Prints a section banner: a blank line, a 60-character "─" rule, the title
+ * indented by two spaces, and a closing rule.
+ *
+ * @param title - Heading text shown between the two rules.
+ */
+function sep(title: string) {
+  const rule = "─".repeat(60);
+  console.log(`\n${rule}`);
+  console.log(`  ${title}`);
+  console.log(rule);
+}
+
+/**
+ * Builds a guard that always rejects with `new Error(message)`, standing in
+ * for a real failure such as a timeout or network error.
+ *
+ * @param message - Message carried by the thrown Error.
+ * @returns A guard function tagged with guardName "error-guard".
+ */
+function makeErrorGuard(message: string): Guard {
+  const g: Guard = async (_input) => {
+    throw new Error(message);
+  };
+  // Object.assign mutates and returns `g` itself, so the tagged function is the same object.
+  return Object.assign(g, { guardName: "error-guard" });
+}
+
+// Guard that resolves to true for every input. It is paired with an error
+// guard in the multi-guard example to show that one passing guard does not
+// hide another guard's error.
+const alwaysPass: Guard = Object.assign(
+  async (_input: Record<string, unknown>): Promise<boolean> => {
+    return true;
+  },
+  { guardName: "always-pass" },
+);
+
+// ── Example 1: validateContent() propagates GuardExecutionError ─────────────────────
+
+/**
+ * Example 1: calls validateContent() with a single guard that throws and
+ * reports whether the rejection surfaced as a GuardExecutionError.
+ * Every outcome is logged; nothing is rethrown.
+ */
+async function example1_validateThrows(): Promise<void> {
+  sep("EXAMPLE 1 — validateContent() throws GuardExecutionError on real error");
+  console.log(
+    "  Running validateContent() with a guard that throws a network error...",
+  );
+
+  try {
+    const failingGuard = makeErrorGuard("Simulated network timeout");
+    await validateContent("some LLM output", [failingGuard]);
+    // Reaching this line means the guard error was swallowed.
+    console.log("  ❌ ERROR: validateContent() should have thrown but didn't");
+  } catch (err) {
+    // Anything other than GuardExecutionError is reported and handled no further.
+    if (!(err instanceof GuardExecutionError)) {
+      console.log("  ❌ Wrong error type thrown:", err);
+      return;
+    }
+
+    console.log("  ✅ GuardExecutionError thrown as expected");
+    console.log(`     .message:           "${err.message}"`);
+    console.log(`     .originalException: "${err.originalException.message}"`);
+    console.log(`     .guardIndex:        ${err.guardIndex}`);
+    console.log(
+      "  ℹ️  Check Traceloop UI: error-guard.guard span → ERROR status,",
+    );
+    console.log("      gen_ai.guardrail.error.type = Error,");
+    console.log(
+      "      gen_ai.guardrail.error.message = Simulated network timeout",
+    );
+  }
+}
+
+// ── Example 2: run() propagates GuardExecutionError ──────────────────────────
+
+/**
+ * Example 2: runs a Guardrails instance configured with onFailure "log" whose
+ * only guard throws, and reports whether run() rejected with
+ * GuardExecutionError. Every outcome is logged; nothing is rethrown.
+ */
+async function example2_runThrows(): Promise<void> {
+  sep("EXAMPLE 2 — run() throws GuardExecutionError on real error");
+  console.log(
+    "  Running Guardrails.run() with a guard that throws an HTTP error...",
+  );
+
+  const guardrails = new Guardrails(
+    [makeErrorGuard("HTTP 503: Service Unavailable")],
+    { onFailure: "log" },
+  );
+
+  try {
+    await guardrails.run(async () => "LLM response text");
+    // Reaching this line means the guard error was swallowed.
+    console.log("  ❌ ERROR: run() should have thrown but didn't");
+  } catch (err) {
+    // Anything other than GuardExecutionError is reported and handled no further.
+    if (!(err instanceof GuardExecutionError)) {
+      console.log("  ❌ Wrong error type thrown:", err);
+      return;
+    }
+
+    console.log(
+      "  ✅ GuardExecutionError thrown — onFailure='log' was NOT called",
+    );
+    console.log(`     .message:           "${err.message}"`);
+    console.log(`     .originalException: "${err.originalException.message}"`);
+    console.log(
+      "  ℹ️  Check Traceloop UI: error-guard.guard span → ERROR status",
+    );
+  }
+}
+
+// ── Example 3: parallel().runAll() — one guard errors, one passes ─────────────
+
+/**
+ * Example 3: runs a passing guard and a throwing guard through
+ * parallel().runAll() and reports whether run() still rejected with
+ * GuardExecutionError. Every outcome is logged; nothing is rethrown.
+ */
+async function example3_parallelRunAllThrows(): Promise<void> {
+  sep(
+    "EXAMPLE 3 — parallel().runAll() propagates error even when another guard passes",
+  );
+  console.log(
+    "  Running 2 guards in parallel (runAll): alwaysPass + errorGuard...",
+  );
+
+  // Order matters for the reported guardIndex: the passing guard comes first.
+  const guards: Guard[] = [
+    alwaysPass,
+    makeErrorGuard("Evaluator API returned 500"),
+  ];
+  const guardrails = new Guardrails(guards, {}).parallel().runAll();
+
+  try {
+    await guardrails.run(async () => "LLM response text");
+    // Reaching this line means the guard error was swallowed.
+    console.log("  ❌ ERROR: run() should have thrown but didn't");
+  } catch (err) {
+    // Anything other than GuardExecutionError is reported and handled no further.
+    if (!(err instanceof GuardExecutionError)) {
+      console.log("  ❌ Wrong error type thrown:", err);
+      return;
+    }
+
+    console.log("  ✅ GuardExecutionError propagated from parallel().runAll()");
+    console.log(`     .message:           "${err.message}"`);
+    console.log(`     .originalException: "${err.originalException.message}"`);
+    console.log(`     .guardIndex:        ${err.guardIndex}`);
+    console.log("  ℹ️  Check Traceloop UI: always-pass.guard → PASSED,");
+    console.log("      error-guard.guard → ERROR with full exception event");
+  }
+}
+
+// ── Main ──────────────────────────────────────────────────────────────────────
+
+/**
+ * Prints the banner, runs the three error-handling examples sequentially
+ * inside one Traceloop workflow, and prints the completion footer.
+ *
+ * Telemetry is flushed in a `finally` block so it is not lost when the
+ * workflow throws; the error itself still propagates to the caller.
+ */
+async function main(): Promise<void> {
+  const rule = "═".repeat(60);
+
+  console.log(`\n${rule}`);
+  console.log("  GUARDRAILS ERROR HANDLING EXAMPLE");
+  console.log(
+    `  Backend: ${process.env.TRACELOOP_BASE_URL ?? "https://api.traceloop.dev"}`,
+  );
+  console.log(`${rule}`);
+  console.log(
+    "\n  Real guard errors throw GuardExecutionError — never silently",
+  );
+  console.log("  treated as logical failures. Check spans for ERROR status.\n");
+
+  try {
+    await traceloop.withWorkflow(
+      { name: "guardrails-error-handling-workflow" },
+      async () => {
+        // Sequential on purpose: each example prints its own banner and result.
+        await example1_validateThrows();
+        await example2_runThrows();
+        await example3_parallelRunAllThrows();
+      },
+    );
+
+    console.log(`\n${rule}`);
+    console.log("  ALL EXAMPLES COMPLETE");
+    console.log(`${rule}\n`);
+  } finally {
+    // Flush on both the success and the failure path.
+    await traceloop.forceFlush();
+  }
+}
+
+// Handle a rejected main() explicitly instead of leaving the promise floating:
+// log the error and mark the process as failed.
+main().catch((err: unknown) => {
+  console.error(err);
+  process.exitCode = 1;
+});