From 19284ddb80443ac019477bf7e3d73f325f8138ec Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Tobi=20L=C3=BCtke?= <tobi@lutke.com>
Date: Wed, 18 Feb 2026 21:50:25 -0500
Subject: [PATCH] refactor(mcp): remove deprecated search tools, keep only
 structured_search

BREAKING CHANGE: MCP tools search, vector_search, deep_search removed.
Use structured_search with lex/vec/hyde queries instead.

- Remove search, vector_search, deep_search MCP tool registrations
- Update MCP instructions to focus on structured_search
- Update skill docs to reflect simplified API
- Rename test describe blocks to reflect that they exercise store
  functions rather than MCP tools
- CLI commands (qmd search, vsearch, query) remain unchanged for
  backward compatibility
---
 skills/qmd/SKILL.md                |   5 +-
 skills/qmd/references/mcp-setup.md |  33 ------
 src/mcp.ts                         | 155 ++---------------------------
 test/mcp.test.ts                   |  16 +--
 4 files changed, 20 insertions(+), 189 deletions(-)

diff --git a/skills/qmd/SKILL.md b/skills/qmd/SKILL.md
index 2386559..80e019a 100644
--- a/skills/qmd/SKILL.md
+++ b/skills/qmd/SKILL.md
@@ -120,10 +120,7 @@ Both `vec` and `hyde` use vector similarity search. The difference is input form
 
 | Tool | Speed | Use Case |
 |------|-------|----------|
-| `structured_search` | ~5s | **Recommended** — you provide query expansions |
-| `search` | ~30ms | Fast keyword lookup (BM25) |
-| `vector_search` | ~2s | Semantic similarity |
-| `deep_search` | ~10s | Auto-expands query (uses small local model) |
+| `structured_search` | ~5s | Search with lex/vec/hyde queries |
 | `get` | instant | Retrieve doc by path or `#docid` |
 | `multi_get` | instant | Retrieve multiple docs |
 | `status` | instant | Index health |
diff --git a/skills/qmd/references/mcp-setup.md b/skills/qmd/references/mcp-setup.md
index 7ce6623..154bcb9 100644
--- a/skills/qmd/references/mcp-setup.md
+++ b/skills/qmd/references/mcp-setup.md
@@ -103,39 +103,6 @@ Execute pre-expanded search queries. **Use this** — you're a capable LLM that
 
 Both `vec` and `hyde` use vector search — the difference is what you write.
 
-### search
-
-Fast BM25 keyword search (~30ms).
-
-| Parameter | Type | Description |
-|-----------|------|-------------|
-| `query` | string | Search query |
-| `collection` | string? | Filter by collection |
-| `limit` | number? | Max results (default: 5) |
-| `minScore` | number? | Min relevance 0-1 |
-
-### vector_search
-
-Semantic similarity search (~2s).
-
-| Parameter | Type | Description |
-|-----------|------|-------------|
-| `query` | string | Natural language query |
-| `collection` | string? | Filter by collection |
-| `limit` | number? | Max results (default: 5) |
-| `minScore` | number? | Min relevance 0-1 |
-
-### deep_search
-
-Hybrid search with automatic query expansion (~10s). Uses a small local model to expand your query. **Prefer `structured_search`** — you generate better expansions.
-
-| Parameter | Type | Description |
-|-----------|------|-------------|
-| `query` | string | Search query |
-| `collection` | string? | Filter by collection |
-| `limit` | number? | Max results (default: 5) |
-| `minScore` | number? | Min relevance 0-1 |
-
 ### get
 
 Retrieve a document by path or docid.
diff --git a/src/mcp.ts b/src/mcp.ts
index 02807c7..274b6a1 100644
--- a/src/mcp.ts
+++ b/src/mcp.ts
@@ -19,8 +19,6 @@ import {
   createStore,
   extractSnippet,
   addLineNumbers,
-  hybridQuery,
-  vectorSearchQuery,
   structuredSearch,
   DEFAULT_MULTI_GET_MAX_BYTES,
 } from "./store.js";
@@ -114,25 +112,23 @@ function buildInstructions(store: Store): string {
   // --- Capability gaps ---
   if (!status.hasVectorIndex) {
     lines.push("");
-    lines.push("Note: No vector embeddings. Only `search` (BM25) is available.");
+    lines.push("Note: No vector embeddings yet. Run `qmd embed` to enable semantic search (vec/hyde).");
   } else if (status.needsEmbedding > 0) {
     lines.push("");
     lines.push(`Note: ${status.needsEmbedding} documents need embedding. Run \`qmd embed\` to update.`);
   }
 
-  // --- When to use which tool (escalation ladder) ---
-  // Tool schemas describe parameters; instructions describe strategy.
+  // --- Search tool ---
   lines.push("");
-  lines.push("Search:");
-  lines.push("  - `search` (~30ms) — BM25 keyword matching. Fast, exact terms.");
-  lines.push("  - `vector_search` (~2s) — semantic search. Finds synonyms and related concepts.");
-  lines.push("  - `deep_search` (~10s) — auto-expands query + reranks. Use when you don't know the exact terms.");
-  lines.push("  - `structured_search` (~5s) — YOU provide the query variations. Best for complex/nuanced queries.");
+  lines.push("Search: Use `structured_search` with 1-4 sub-queries:");
+  lines.push("  - type:'lex' — BM25 keyword search (exact terms, fast)");
+  lines.push("  - type:'vec' — semantic vector search (meaning-based)");
+  lines.push("  - type:'hyde' — hypothetical document (write what the answer looks like)");
   lines.push("");
-  lines.push("For structured_search, pass 2-4 sub-searches:");
-  lines.push("  - type:'lex' for keyword phrases (BM25)");
-  lines.push("  - type:'vec' for semantic questions");
-  lines.push("  - type:'hyde' for hypothetical answer snippets");
+  lines.push("Examples:");
+  lines.push("  Quick keyword lookup: [{type:'lex', query:'error handling'}]");
+  lines.push("  Semantic search: [{type:'vec', query:'how to handle errors gracefully'}]");
+  lines.push("  Best results: [{type:'lex', query:'error'}, {type:'vec', query:'error handling best practices'}]");
 
   // --- Retrieval workflow ---
   lines.push("");
@@ -229,136 +225,7 @@ function createMcpServer(store: Store): McpServer {
   );
 
   // ---------------------------------------------------------------------------
-  // Tool: qmd_search (keyword)
-  // ---------------------------------------------------------------------------
-
-  server.registerTool(
-    "search",
-    {
-      title: "Keyword Search",
-      description: "Search by keyword. Finds documents containing exact words and phrases in the query.",
-      annotations: { readOnlyHint: true, openWorldHint: false },
-      inputSchema: {
-        query: z.string().describe("Search query - keywords or phrases to find"),
-        limit: z.number().optional().default(10).describe("Maximum number of results (default: 10)"),
-        minScore: z.number().optional().default(0).describe("Minimum relevance score 0-1 (default: 0)"),
-        collection: z.string().optional().describe("Filter to a specific collection by name"),
-      },
-    },
-    async ({ query, limit, minScore, collection }) => {
-      const results = store.searchFTS(query, limit || 10, collection);
-      const filtered: SearchResultItem[] = results
-        .filter(r => r.score >= (minScore || 0))
-        .map(r => {
-          const { line, snippet } = extractSnippet(r.body || "", query, 300, r.chunkPos);
-          return {
-            docid: `#${r.docid}`,
-            file: r.displayPath,
-            title: r.title,
-            score: Math.round(r.score * 100) / 100,
-            context: store.getContextForFile(r.filepath),
-            snippet: addLineNumbers(snippet, line),  // Default to line numbers
-          };
-        });
-
-      return {
-        content: [{ type: "text", text: formatSearchSummary(filtered, query) }],
-        structuredContent: { results: filtered },
-      };
-    }
-  );
-
-  // ---------------------------------------------------------------------------
-  // Tool: qmd_vector_search (Vector semantic search)
-  // ---------------------------------------------------------------------------
-
-  server.registerTool(
-    "vector_search",
-    {
-      title: "Vector Search",
-      description: "Search by meaning. Finds relevant documents even when they use different words than the query — handles synonyms, paraphrases, and related concepts.",
-      annotations: { readOnlyHint: true, openWorldHint: false },
-      inputSchema: {
-        query: z.string().describe("Natural language query - describe what you're looking for"),
-        limit: z.number().optional().default(10).describe("Maximum number of results (default: 10)"),
-        minScore: z.number().optional().default(0.3).describe("Minimum relevance score 0-1 (default: 0.3)"),
-        collection: z.string().optional().describe("Filter to a specific collection by name"),
-      },
-    },
-    async ({ query, limit, minScore, collection }) => {
-      const results = await vectorSearchQuery(store, query, { collection, limit, minScore });
-
-      if (results.length === 0) {
-        // Distinguish "no embeddings" from "no matches" — check if vector table exists
-        const tableExists = store.db.prepare(`SELECT name FROM sqlite_master WHERE type='table' AND name='vectors_vec'`).get();
-        if (!tableExists) {
-          return {
-            content: [{ type: "text", text: "Vector index not found. Run 'qmd embed' first to create embeddings." }],
-            isError: true,
-          };
-        }
-      }
-
-      const filtered: SearchResultItem[] = results.map(r => {
-        const { line, snippet } = extractSnippet(r.body, query, 300);
-        return {
-          docid: `#${r.docid}`,
-          file: r.displayPath,
-          title: r.title,
-          score: Math.round(r.score * 100) / 100,
-          context: r.context,
-          snippet: addLineNumbers(snippet, line),
-        };
-      });
-
-      return {
-        content: [{ type: "text", text: formatSearchSummary(filtered, query) }],
-        structuredContent: { results: filtered },
-      };
-    }
-  );
-
-  // ---------------------------------------------------------------------------
-  // Tool: qmd_deep_search (Deep search with expansion + reranking)
-  // ---------------------------------------------------------------------------
-
-  server.registerTool(
-    "deep_search",
-    {
-      title: "Deep Search",
-      description: "Deep search. Auto-expands the query into variations, searches each by keyword and meaning, and reranks for top hits across all results.",
-      annotations: { readOnlyHint: true, openWorldHint: false },
-      inputSchema: {
-        query: z.string().describe("Natural language query - describe what you're looking for"),
-        limit: z.number().optional().default(10).describe("Maximum number of results (default: 10)"),
-        minScore: z.number().optional().default(0).describe("Minimum relevance score 0-1 (default: 0)"),
-        collection: z.string().optional().describe("Filter to a specific collection by name"),
-      },
-    },
-    async ({ query, limit, minScore, collection }) => {
-      const results = await hybridQuery(store, query, { collection, limit, minScore });
-
-      const filtered: SearchResultItem[] = results.map(r => {
-        const { line, snippet } = extractSnippet(r.bestChunk, query, 300);
-        return {
-          docid: `#${r.docid}`,
-          file: r.displayPath,
-          title: r.title,
-          score: Math.round(r.score * 100) / 100,
-          context: r.context,
-          snippet: addLineNumbers(snippet, line),
-        };
-      });
-
-      return {
-        content: [{ type: "text", text: formatSearchSummary(filtered, query) }],
-        structuredContent: { results: filtered },
-      };
-    }
-  );
-
-  // ---------------------------------------------------------------------------
-  // Tool: qmd_structured_search (Pre-expanded queries from LLM)
+  // Tool: structured_search (Primary search tool)
   // ---------------------------------------------------------------------------
 
   const subSearchSchema = z.object({
diff --git a/test/mcp.test.ts b/test/mcp.test.ts
index e09df8b..ba20164 100644
--- a/test/mcp.test.ts
+++ b/test/mcp.test.ts
@@ -257,7 +257,7 @@ describe("MCP Server", () => {
   // Tool: qmd_search (BM25)
   // ===========================================================================
 
-  describe("qmd_search tool", () => {
+  describe("searchFTS (BM25 keyword search)", () => {
     test("returns results for matching query", () => {
       const results = searchFTS(testDb, "readme", 10);
       expect(results.length).toBeGreaterThan(0);
@@ -295,10 +295,10 @@ describe("MCP Server", () => {
   });
 
   // ===========================================================================
-  // Tool: qmd_vector_search (Vector)
+  // searchVec (Vector similarity search)
   // ===========================================================================
 
-  describe.skipIf(!!process.env.CI)("qmd_vector_search tool", () => {
+  describe.skipIf(!!process.env.CI)("searchVec (vector similarity)", () => {
     test("returns results for semantic query", async () => {
       const results = await searchVec(testDb, "project documentation", DEFAULT_EMBED_MODEL, 10);
       expect(results.length).toBeGreaterThan(0);
@@ -321,10 +321,10 @@ describe("MCP Server", () => {
   });
 
   // ===========================================================================
-  // Tool: qmd_deep_search (Deep search)
+  // hybridQuery (query expansion + reranking)
   // ===========================================================================
 
-  describe.skipIf(!!process.env.CI)("qmd_deep_search tool", () => {
+  describe.skipIf(!!process.env.CI)("hybridQuery (expansion + reranking)", () => {
     test("expands query with typed variations", async () => {
       const expanded = await expandQuery("api documentation", DEFAULT_QUERY_MODEL, testDb);
       // Returns ExpandedQuery[] — typed expansions, original excluded
@@ -1008,12 +1008,12 @@ describe("MCP HTTP Transport", () => {
     expect(contentType).toContain("application/json");
 
     const toolNames = json.result.tools.map((t: any) => t.name);
-    expect(toolNames).toContain("search");
+    expect(toolNames).toContain("structured_search");
     expect(toolNames).toContain("get");
     expect(toolNames).toContain("status");
   });
 
-  test("POST /mcp tools/call search returns results", async () => {
+  test("POST /mcp tools/call structured_search returns results", async () => {
     // Initialize
     await mcpRequest({
       jsonrpc: "2.0", id: 1, method: "initialize",
@@ -1022,7 +1022,7 @@ describe("MCP HTTP Transport", () => {
 
     const { status, json } = await mcpRequest({
       jsonrpc: "2.0", id: 3, method: "tools/call",
-      params: { name: "search", arguments: { query: "readme" } },
+      params: { name: "structured_search", arguments: { searches: [{ type: "lex", query: "readme" }] } },
     });
     expect(status).toBe(200);
     expect(json.result).toBeDefined();