NVIDIA-NeMo
diff --git a/‎.github/CODEOWNERS‎
Lines changed: 1 addition & 0 deletions b/‎.github/CODEOWNERS‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎docs/catalog.md‎
Lines changed: 1 addition & 0 deletions b/‎docs/catalog.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎plugins/data-designer-visual-search/CODEOWNERS‎
Lines changed: 3 additions & 0 deletions b/‎plugins/data-designer-visual-search/CODEOWNERS‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎plugins/data-designer-visual-search/README.md‎
Lines changed: 58 additions & 0 deletions b/‎plugins/data-designer-visual-search/README.md‎
Lines changed: 58 additions & 0 deletions
diff --git a/‎plugins/data-designer-visual-search/pyproject.toml‎
Lines changed: 38 additions & 0 deletions b/‎plugins/data-designer-visual-search/pyproject.toml‎
Lines changed: 38 additions & 0 deletions
diff --git a/‎plugins/data-designer-visual-search/src/data_designer_visual_search/__init__.py‎
Lines changed: 2 additions & 0 deletions b/‎plugins/data-designer-visual-search/src/data_designer_visual_search/__init__.py‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎plugins/data-designer-visual-search/src/data_designer_visual_search/config.py‎
Lines changed: 105 additions & 0 deletions b/‎plugins/data-designer-visual-search/src/data_designer_visual_search/config.py‎
Lines changed: 105 additions & 0 deletions
@@ -8,3 +8,4 @@
 
 # Plugins
 /plugins/data-designer-template/ @NVIDIA-NeMo/data_designer_reviewers
+/plugins/data-designer-visual-search/ eric.tramel@gmail.com
@@ -5,3 +5,4 @@ Auto-generated from plugin metadata. Do not edit manually.
 | Plugin | Version | Column Type | Description |
 |--------|---------|-------------|-------------|
 | data-designer-template | 0.1.0 | `text-transform` | Template Data Designer plugin — text transform column generator |
+| data-designer-visual-search | 0.1.0 | `visual-search` | Data Designer visual-search plugin |
@@ -0,0 +1,3 @@
+# Owner(s) of this plugin — used to generate the root CODEOWNERS file.
+# GitHub accepts @username, @org/team, or email format.
+* eric.tramel@gmail.com
@@ -0,0 +1,58 @@
+# data-designer-visual-search
+
+Data Designer plugin for VLM-driven visual search over image columns.
+
+The `visual-search` column runs a vision-capable chat model with built-in
+image-operation tools:
+
+- `open_image`
+- `get_image_info`
+- `list_images`
+- `crop_image`
+- `transform_image`
+- `edit_color`
+
+Each operation returns an `image_id`. The column keeps intermediate images in
+memory and re-attaches tool-produced images to the following model turn, so the
+model can inspect a crop or transformed image before deciding what to do next.
+Because IDs remain addressable, the model can branch from an earlier image
+rather than being forced through a linear edit chain.
+
+## Installation
+
+```bash
+pip install data-designer-visual-search
+```
+
+## Usage
+
+Once installed, the `visual-search` column type is automatically discovered by
+[NeMo Data Designer](https://github.com/NVIDIA-NeMo/DataDesigner).
+
+```python
+import pandas as pd
+from data_designer.config.config_builder import DataDesignerConfigBuilder
+from data_designer.config.seed_source_dataframe import DataFrameSeedSource
+from data_designer.interface.data_designer import DataDesigner
+
+seed_df = pd.DataFrame({"image_path": ["/path/to/scene.png"]})
+
+builder = DataDesignerConfigBuilder()
+builder.with_seed_dataset(DataFrameSeedSource(df=seed_df))
+builder.add_column(
+    name="visual_answer",
+    column_type="visual-search",
+    image_column="image_path",
+    prompt="Find the red object. Crop or transform the image if that helps.",
+    model_alias="nvidia-vision",
+    # Optional: set a model-specific image token here if your endpoint requires
+    # one in the text for every attached image.
+    # image_placeholder="<image>",
+)
+
+result = DataDesigner(artifact_path="artifacts").preview(builder, num_records=1)
+```
+
+The main output column contains the model's final answer. By default the plugin
+also writes `{column_name}__image_history`, a compact tree of image IDs, parent
+IDs, operations, and dimensions; set `include_image_history=False` to omit it.
@@ -0,0 +1,38 @@
+# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+
+[project]
+name = "data-designer-visual-search"
+version = "0.1.0"
+description = "Data Designer visual-search plugin"
+requires-python = ">=3.10"
+dependencies = [
+    "data-designer>=0.5.7",
+    "pillow",
+    "requests",
+]
+license = "Apache-2.0"
+readme = "README.md"
+authors = [
+    {name = "NVIDIA Corporation"},
+]
+classifiers = [
+    "Development Status :: 3 - Alpha",
+    "Programming Language :: Python :: 3",
+]
+
+[project.entry-points."data_designer.plugins"]
+visual-search = "data_designer_visual_search.plugin:plugin"
+
+[project.urls]
+Repository = "https://github.com/NVIDIA-NeMo/DataDesignerPlugins"
+
+[build-system]
+requires = ["hatchling"]
+build-backend = "hatchling.build"
+
+[tool.hatch.build.targets.wheel]
+packages = ["src/data_designer_visual_search"]
+
+[tool.ruff]
+extend = "../../pyproject.toml"
@@ -0,0 +1,2 @@
+# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
@@ -0,0 +1,105 @@
+# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+
+from typing import Literal
+
+from data_designer.config.base import SingleColumnConfig
+from data_designer.config.models import ModalityDataType
+from data_designer.config.utils.constants import REASONING_CONTENT_COLUMN_POSTFIX, TRACE_COLUMN_POSTFIX
+from data_designer.config.utils.image_helpers import ImageFormat
+from data_designer.config.utils.misc import assert_valid_jinja2_template, extract_keywords_from_jinja2_template
+from data_designer.config.utils.trace_type import TraceType
+from pydantic import Field, model_validator
+from typing_extensions import Self
+
+VisualSearchToolName = Literal[  # Closed set of built-in tool names; element type of `allowed_tools`.
+    "open_image",
+    "get_image_info",
+    "list_images",
+    "crop_image",
+    "transform_image",
+    "edit_color",
+]
+
+
+class VisualSearchColumnConfig(SingleColumnConfig):
+    """Configuration for image-grounded visual search with local image-operation tools.
+
+    The column runs a vision-capable chat model with built-in image tools. Each tool
+    returns an image ID, and subsequent calls may operate on any previous image ID,
+    which lets the model branch from earlier points in the image history.
+    """
+
+    column_type: Literal["visual-search"] = "visual-search"
+
+    image_column: str = Field(description="Column containing a local image path, URL, base64 string, or data URI.")
+    prompt: str = Field(description="Jinja2 prompt template for the visual search task.")
+    model_alias: str = Field(description="Alias of the vision-capable chat model to use.")
+    system_prompt: str | None = Field(default=None, description="Optional Jinja2 system prompt template.")
+    image_data_type: ModalityDataType | None = Field(
+        default=None,
+        description="Optional explicit format for values in image_column. Leave unset for auto-detection.",
+    )
+    image_format: ImageFormat | None = Field(
+        default=None,
+        description="Required when image_data_type is base64 and the image format cannot be auto-detected.",
+    )
+    image_placeholder: str | None = Field(
+        default=None,
+        description="Optional model-specific image token to include in text for endpoints that require it.",
+    )
+    max_tool_call_turns: int = Field(
+        default=6,
+        ge=1,
+        description="Maximum tool-calling turns allowed for each row before the model must answer.",
+    )
+    allowed_tools: list[VisualSearchToolName] | None = Field(
+        default=None,
+        description="Optional allowlist of built-in visual tools. Defaults to all tools.",
+    )
+    attach_images_after_tool_calls: bool = Field(
+        default=True,
+        description="Attach resulting tool images back into the next model turn.",
+    )
+    include_image_history: bool = Field(
+        default=True,
+        description="Add a side-effect column with the tree of image operations and IDs.",
+    )
+    with_trace: TraceType = Field(default=TraceType.NONE, description="Optional chat trace capture mode.")
+    extract_reasoning_content: bool = Field(
+        default=False,
+        description="If True, capture reasoning_content from the final assistant message.",
+    )
+    use_default_system_prompt: bool = Field(
+        default=True,
+        description="Prepend built-in instructions explaining image IDs and visual tools.",
+    )
+
+    @staticmethod
+    def get_column_emoji() -> str:
+        return "🔎"
+
+    @property
+    def required_columns(self) -> list[str]:
+        required_cols = [self.image_column, *extract_keywords_from_jinja2_template(self.prompt)]
+        if self.system_prompt:
+            required_cols.extend(extract_keywords_from_jinja2_template(self.system_prompt))
+        return list(dict.fromkeys(required_cols))
+
+    @property
+    def side_effect_columns(self) -> list[str]:
+        return [
+            *([f"{self.name}__image_history"] if self.include_image_history else []),
+            *([f"{self.name}{TRACE_COLUMN_POSTFIX}"] if self.with_trace != TraceType.NONE else []),
+            *([f"{self.name}{REASONING_CONTENT_COLUMN_POSTFIX}"] if self.extract_reasoning_content else []),
+        ]
+
+    @model_validator(mode="after")
+    def validate_templates_and_image_format(self) -> Self:
+        """Validate prompt templates and image modality settings."""
+        assert_valid_jinja2_template(self.prompt)
+        if self.system_prompt:
+            assert_valid_jinja2_template(self.system_prompt)
+        if self.image_data_type == ModalityDataType.BASE64 and self.image_format is None:
+            raise ValueError("image_format is required when image_data_type is base64")
+        return self
Original file line number	Diff line number	Diff line change
`@@ -8,3 +8,4 @@`
`8`	`8`
`9`	`9`	`# Plugins`
`10`	`10`	`/plugins/data-designer-template/ @NVIDIA-NeMo/data_designer_reviewers`
	`11`	`+/plugins/data-designer-visual-search/ eric.tramel@gmail.com`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+# Owner(s) of this plugin — used to generate the root CODEOWNERS file.`
	`2`	`+# GitHub accepts @username, @org/team, or email format.`
	`3`	`+* eric.tramel@gmail.com`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.`
	`2`	`+# SPDX-License-Identifier: Apache-2.0`