Fix missing provider prefix in the embedding registry model name

xoxruns · xoxruns · commit c5ee5340e6ca · 2026-02-09T11:01:21.000+01:00
diff --git a/.github/workflows/build-release.yml b/.github/workflows/build-release.yml
@@ -248,7 +248,7 @@ jobs:
           tag_name: ${{ steps.version.outputs.version }}
           name: Release ${{ steps.version.outputs.version }}
           body: |
-            ## Deadend CLI ${{ steps.version.outputs.version }}
+            ## Deadend CLI ${{ steps.version.outputs.version }} (stable version)
             
             ### Server Downloads (RPC Server)
             
@@ -278,6 +278,8 @@ jobs:
             tar -xzf deadend-<platform>-<arch>.tar.gz
             cd deadend-<platform>-<arch>
             sudo cp -r * /usr/local/
+
+            Hope you enjoy the new release! Let me know if this works on macOS and Linux.
             ```
           files: |
             artifacts/**/*
diff --git a/deadend_cli/deadend_agent/src/deadend_agent/models/registry.py b/deadend_cli/deadend_agent/src/deadend_agent/models/registry.py
@@ -69,13 +69,23 @@ async def batch_embed(self, input_texts: list[str]) -> list[dict]:
             #
             # NOTE:
             # - `self.model` should follow the LiteLLM model name convention,
-            #   e.g. "openai:text-embedding-3-small" or "openrouter:qwen/qwen3-embedding-8b".
+            #   e.g. "openai/text-embedding-3-small" or "openrouter/qwen/qwen3-embedding-8b".
             # - API keys / base URLs are expected to be configured via LiteLLM
-            #   environment variables or global configuration.
-            data = await aembedding(
-                model=self.model,
-                input=input_texts,
-            )
+            #   environment variables or passed explicitly below.
+            kwargs: dict = {
+                "model": self.model,
+                "input": input_texts,
+            }
+
+            # For custom endpoints, we need api_key and api_base
+            if self.base_url:
+                kwargs["api_base"] = self.base_url
+
+            # API key handling
+            if self.api_key:
+                kwargs["api_key"] = self.api_key
+
+            data = await aembedding(**kwargs)
         except Exception as exc:  # pragma: no cover - defensive logging
             logger.error("Embedding call via LiteLLM failed: %s", exc)
             raise ValueError(f"Embedding API error: {exc}") from exc
@@ -168,8 +178,10 @@ def _initialize_models(self, config: Config):
                     # Use the first embedding spec we encounter as the embedder client
                     if self.embedder_model is None:
                         # api_key, base_url = self._resolve_embedding_credentials(spec)
+                        # LiteLLM expects model identifiers in the form "provider/model_name"
+                        # e.g. "openai/text-embedding-3-small" or "openrouter/qwen/qwen3-embedding-8b".
                         self.embedder_model = EmbedderClient(
-                            model_name=spec.model_name,
+                            model_name=f"{spec.provider}/{spec.model_name}",
                             api_key=spec.api_key,
                             base_url=spec.base_url,
                         )