VectifyAI
diff --git a/‎bench/benchmark_retrievers.py‎
Lines changed: 645 additions & 0 deletions b/‎bench/benchmark_retrievers.py‎
Lines changed: 645 additions & 0 deletions
diff --git a/‎bench/build_context7_fs.py‎
Lines changed: 104 additions & 0 deletions b/‎bench/build_context7_fs.py‎
Lines changed: 104 additions & 0 deletions
diff --git a/‎bench/filesystem/context7/queries.json‎
Lines changed: 24 additions & 0 deletions b/‎bench/filesystem/context7/queries.json‎
Lines changed: 24 additions & 0 deletions
diff --git a/‎bench/filesystem/context7/tree.json‎
Lines changed: 242 additions & 0 deletions b/‎bench/filesystem/context7/tree.json‎
Lines changed: 242 additions & 0 deletions
diff --git a/‎bench/fs_block_beam_vertical.json‎
Lines changed: 67 additions & 0 deletions b/‎bench/fs_block_beam_vertical.json‎
Lines changed: 67 additions & 0 deletions
diff --git a/‎bench/fs_block_beam_vertical.md‎
Lines changed: 16 additions & 0 deletions b/‎bench/fs_block_beam_vertical.md‎
Lines changed: 16 additions & 0 deletions
@@ -0,0 +1,104 @@
+#!/usr/bin/env python3
+"""Build Context7 filesystem corpus as one JSON tree file."""
+
+from __future__ import annotations
+
+import json
+import os
+import re
+import urllib.request
+from datetime import datetime, timezone
+from pathlib import Path
+from urllib.parse import urlparse
+
+# Output directory for the corpus: "filesystem/context7" next to this script.
+BASE_DIR = Path(__file__).resolve().parent / "filesystem" / "context7"
+# Index document that is scanned for links to the individual doc pages.
+LLMS_TXT_URL = "https://context7.com/docs/llms.txt"
+# Name of the single JSON file (inside BASE_DIR) that holds every fetched doc.
+TREE_FILENAME = "tree.json"
+# Optional cap on the number of docs, read from the CONTEXT7_MAX_DOCS env var.
+# 0 means "all docs found in llms.txt".
+MAX_DOCS = int(os.environ.get("CONTEXT7_MAX_DOCS", "0"))
+# Timeout, in seconds, passed to urllib.request.urlopen for every request.
+TIMEOUT = 15
+
+
+def fetch_text(url: str) -> str:
+    req = urllib.request.Request(
+        url, headers={"User-Agent": "ConDB-context7-builder/1.0"}
+    )
+    with urllib.request.urlopen(req, timeout=TIMEOUT) as resp:
+        return resp.read().decode("utf-8", errors="replace")
+
+
+def parse_doc_urls(llms_txt: str) -> list[str]:
+    urls = re.findall(r"\((https://context7\.com/docs/[^)]+)\)", llms_txt)
+    dedup: list[str] = []
+    seen: set[str] = set()
+    for url in urls:
+        if url in seen:
+            continue
+        seen.add(url)
+        dedup.append(url)
+    return dedup
+
+
+def logical_path_for_url(url: str) -> str:
+    path = urlparse(url).path.lstrip("/")
+    if not path:
+        path = "index.md"
+    if path.endswith("/"):
+        path += "index.md"
+    if "." not in Path(path).name:
+        path += ".md"
+    return path
+
+
+def write_tree_file(out_path: Path, docs: list[dict[str, str]]) -> None:
+    payload = {
+        "generated_at": datetime.now(timezone.utc).isoformat(),
+        "source_index": LLMS_TXT_URL,
+        "docs_count": len(docs),
+        "docs": docs,
+    }
+    out_path.write_text(json.dumps(payload, ensure_ascii=False, indent=2), encoding="utf-8")
+
+
+def main() -> None:
+    BASE_DIR.mkdir(parents=True, exist_ok=True)
+
+    llms_txt = fetch_text(LLMS_TXT_URL)
+    all_doc_urls = parse_doc_urls(llms_txt)
+    doc_urls = [url for url in all_doc_urls if url.endswith(".md")]
+    if not doc_urls:
+        raise RuntimeError(f"no markdown doc urls found from {LLMS_TXT_URL}")
+    if MAX_DOCS > 0:
+        doc_urls = doc_urls[:MAX_DOCS]
+
+    docs: list[dict[str, str]] = []
+    errors: list[dict[str, str]] = []
+
+    for url in doc_urls:
+        try:
+            content = fetch_text(url)
+            path = logical_path_for_url(url)
+            docs.append({"url": url, "path": path, "content": content})
+            print(f"+ {url} -> {TREE_FILENAME}::{path}")
+        except Exception as e:  # noqa: BLE001
+            errors.append({"url": url, "error": str(e)})
+            print(f"! failed: {url} ({e})")
+
+    if not docs:
+        raise RuntimeError(f"failed to fetch any context7 docs; errors={len(errors)}")
+
+    tree_path = BASE_DIR / TREE_FILENAME
+    write_tree_file(tree_path, docs)
+
+    print(
+        f"done: docs={len(docs)} errors={len(errors)} "
+        f"tree={tree_path}"
+    )
+    if errors:
+        print("error_summary:")
+        for err in errors:
+            print(f"- {err['url']} :: {err['error']}")
+
+
+# Run the build only when this file is executed as a script, not on import.
+if __name__ == "__main__":
+    main()
@@ -0,0 +1,24 @@
+{
+  "queries": [
+    {
+      "query": "Where is the API guide for Context7?",
+      "ground_truth": ["docs/api-guide.md"]
+    },
+    {
+      "query": "Where is the overview page for Context7 agentic tools?",
+      "ground_truth": ["docs/agentic-tools/overview.md"]
+    },
+    {
+      "query": "Where is the query-docs tool documented in AI SDK tools?",
+      "ground_truth": ["docs/agentic-tools/ai-sdk/tools/query-docs.md"]
+    },
+    {
+      "query": "Where is the resolve-library-id tool documented?",
+      "ground_truth": ["docs/agentic-tools/ai-sdk/tools/resolve-library-id.md"]
+    },
+    {
+      "query": "Where is the API reference for adding a GitHub repository?",
+      "ground_truth": ["docs/api-reference/add-library/add-a-github-repository.md"]
+    }
+  ]
+}
@@ -0,0 +1,67 @@
+{
+  "generated_at_utc": "2026-03-18T11:28:35.747027+00:00",
+  "rows": [
+    {
+      "scenario": "context7",
+      "retriever": "Block",
+      "queries_ok": 5,
+      "queries_total": 5,
+      "avg_time_s": 5.46975998878479,
+      "avg_llm_calls": 1.0,
+      "total_cost": 0.07618710000000001,
+      "hit1": 1.0,
+      "hit10": 1.0
+    },
+    {
+      "scenario": "context7",
+      "retriever": "Beam",
+      "queries_ok": 5,
+      "queries_total": 5,
+      "avg_time_s": 20.17977318763733,
+      "avg_llm_calls": 4.6,
+      "total_cost": 0.132762,
+      "hit1": 0.6,
+      "hit10": 0.8
+    },
+    {
+      "scenario": "context7",
+      "retriever": "Vertical",
+      "queries_ok": 5,
+      "queries_total": 5,
+      "avg_time_s": 7.308028888702393,
+      "avg_llm_calls": 1.6,
+      "total_cost": 0.14863275,
+      "hit1": 1.0,
+      "hit10": 1.0
+    }
+  ],
+  "aggregate": [
+    {
+      "retriever": "Block",
+      "queries_total": 5,
+      "avg_time_s": 5.46975998878479,
+      "avg_llm_calls": 1.0,
+      "hit1": 1.0,
+      "hit10": 1.0,
+      "total_cost_usd": 0.07618710000000001
+    },
+    {
+      "retriever": "Beam",
+      "queries_total": 5,
+      "avg_time_s": 20.17977318763733,
+      "avg_llm_calls": 4.6,
+      "hit1": 0.6,
+      "hit10": 0.8,
+      "total_cost_usd": 0.132762
+    },
+    {
+      "retriever": "Vertical",
+      "queries_total": 5,
+      "avg_time_s": 7.308028888702393,
+      "avg_llm_calls": 1.6,
+      "hit1": 1.0,
+      "hit10": 1.0,
+      "total_cost_usd": 0.14863275
+    }
+  ]
+}
@@ -0,0 +1,16 @@
+# Filesystem Retriever Comparison (Block vs Beam vs Vertical)
+
+Data sources:
+- `bench/fs_block_beam_vertical.json`
+
+Run setup: `fs_query_order=prefix`, `beam_size=3`, `max_turns=10`, total `5` queries on `context7` only.
+
+## Overall (5 queries: context7)
+
+| Retriever | Avg Time (s) | Avg LLM Calls | Total Cost (USD) | Hit@1 | Hit@10 |
+|---|---:|---:|---:|---:|---:|
+| Block | 5.4698 | 1.0000 | 0.0762 | 1.0000 | 1.0000 |
+| Vertical | 7.3080 | 1.6000 | 0.1486 | 1.0000 | 1.0000 |
+| Beam | 20.1798 | 4.6000 | 0.1328 | 0.6000 | 0.8000 |
+
+Conclusion: on the current `context7` filesystem set, `Block` is still the best default. It keeps perfect `Hit@1` / `Hit@10`, while staying faster and cheaper than `Vertical`. `Beam` remains cheaper than `Vertical`, but it still loses clearly on accuracy.