From 7f1207db0bdca40b1cea8daa3769af8c62cfa85e Mon Sep 17 00:00:00 2001 From: Tobias Wochinger Date: Wed, 17 Jun 2026 10:46:32 +0200 Subject: [PATCH 1/5] docs(evaluation): document multi-modal datasets --- .../datasets-create-dataset-item.mdx | 42 ++++++++- .../2026-06-18-multi-modal-datasets.mdx | 45 ++++++++++ .../evaluation/experiments/data-model.mdx | 14 +++ .../docs/evaluation/experiments/datasets.mdx | 84 +++++++++++++++++ .../experiments/experiments-via-sdk.mdx | 89 +++++++++++++++++++ .../observability/features/multi-modality.mdx | 4 +- .../deployment/infrastructure/blobstorage.mdx | 6 +- 7 files changed, 279 insertions(+), 5 deletions(-) create mode 100644 content/changelog/2026-06-18-multi-modal-datasets.mdx diff --git a/components-mdx/datasets-create-dataset-item.mdx b/components-mdx/datasets-create-dataset-item.mdx index e3c11dd81b..cf425cdf57 100644 --- a/components-mdx/datasets-create-dataset-item.mdx +++ b/components-mdx/datasets-create-dataset-item.mdx @@ -19,6 +19,24 @@ langfuse.create_dataset_item( ) ``` +You can also add media to dataset item `input`, `expected_output`, or `metadata`: + +```python +from langfuse.media import LangfuseMedia + +langfuse.create_dataset_item( + dataset_name="visual-qa", + input={ + "question": "What is shown in this image?", + "image": LangfuseMedia( + file_path="./example.jpg", + content_type="image/jpeg", + ), + }, + expected_output={"label": "invoice"}, +) +``` + _See [Python SDK](/docs/sdk/python/sdk-v3) docs for details on how to initialize the Python client._ @@ -29,7 +47,7 @@ import { LangfuseClient } from "@langfuse/client"; const langfuse = new LangfuseClient(); -await langfuse.api.datasetItems.create({ +await langfuse.dataset.createItem({ datasetName: "", // any JS object or value input: { @@ -46,6 +64,28 @@ await langfuse.api.datasetItems.create({ }); ``` +You can also add media to dataset item `input`, `expectedOutput`, or `metadata`: + +```ts +import { LangfuseClient, LangfuseMedia } from "@langfuse/client"; +import fs from "node:fs"; + +const langfuse = new LangfuseClient(); + +await langfuse.dataset.createItem({ + datasetName: "visual-qa", + input: { + question: "What is shown in this image?", + image: new LangfuseMedia({ + source: "bytes", + contentBytes: fs.readFileSync("./example.jpg"), + contentType: "image/jpeg", + }), + }, + expectedOutput: { label: "invoice" }, +}); +``` + _See [JS/TS SDK](/docs/sdk/typescript/guide) docs for details on how to initialize the JS/TS client._ diff --git a/content/changelog/2026-06-18-multi-modal-datasets.mdx b/content/changelog/2026-06-18-multi-modal-datasets.mdx new file mode 100644 index 0000000000..ced6217460 --- /dev/null +++ b/content/changelog/2026-06-18-multi-modal-datasets.mdx @@ -0,0 +1,45 @@ +--- +date: 2026-06-18 +title: Multi-modal datasets +description: Create Langfuse dataset items with images, audio, video, documents, and other attachments for SDK-based multi-modal experiments. +author: Tobias Wochinger +canonical: /docs/evaluation/experiments/datasets +--- + +import { ChangelogHeader } from "@/components/changelog/ChangelogHeader"; +import { Book, FlaskConical } from "lucide-react"; + + + +