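Fix MCP tool allowlist filtering: use `toolNames.includes(tool.name)` instead of `tool.name in toolNames`, which tests array indices rather than values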

CodebuffAI · CodebuffAI · commit 2270ea2486e3 · 2026-04-15T02:12:13.000Z
diff --git a/sdk/src/__tests__/run-mcp-tool-filter.test.ts b/sdk/src/__tests__/run-mcp-tool-filter.test.ts
@@ -0,0 +1,124 @@
+import * as mainPromptModule from '@codebuff/agent-runtime/main-prompt'
+import { getInitialSessionState } from '@codebuff/common/types/session-state'
+import { getStubProjectFileContext } from '@codebuff/common/util/file'
+import { afterEach, describe, expect, it, mock, spyOn } from 'bun:test'
+
+import { CodebuffClient } from '../client'
+import * as mcpClientModule from '@codebuff/common/mcp/client'
+import * as databaseModule from '../impl/database'
+
+import type { AgentDefinition } from '@codebuff/common/templates/initial-agents-dir/types/agent-definition'
+import type { MCPConfig } from '@codebuff/common/types/mcp'
+
+const browserMcpConfig: MCPConfig = { // stdio MCP server config used by TEST_AGENT.mcpServers and by the requestMcpToolData call in the test
+  type: 'stdio',
+  command: 'npx',
+  args: ['-y', 'fake-mcp-server'], // placeholder package name; getMCPClient is mocked in the test, so presumably nothing is spawned
+  env: {},
+}
+
+const TEST_AGENT: AgentDefinition = { // agent fixture whose toolNames allowlist names two of the three tools the mocked server lists
+  id: 'mcp-filter-agent',
+  displayName: 'MCP Filter Agent',
+  model: 'openai/gpt-5-mini',
+  reasoningOptions: { effort: 'minimal' },
+  mcpServers: {
+    browser: browserMcpConfig, // the key 'browser' matches the 'browser/' prefix used in toolNames
+  },
+  toolNames: ['browser/browser_navigate', 'browser/browser_snapshot'], // browser_click is left out so the test can check that it is filtered
+  systemPrompt: 'Test MCP filtering.',
+}
+
+describe('MCP tool filtering', () => { // checks that requestMcpToolData returns only the tools named in the toolNames it is given
+  afterEach(() => {
+    mock.restore() // undo the spies installed by the test
+  })
+
+  it('returns only allowlisted MCP tools when an agent restricts toolNames', async () => {
+    spyOn(databaseModule, 'getUserInfoFromApiKey').mockResolvedValue({ // canned user record; database-module calls are stubbed below
+      id: 'user-123',
+      email: 'test@example.com',
+      discord_id: null,
+      referral_code: null,
+      stripe_customer_id: null,
+      banned: false,
+    })
+    spyOn(databaseModule, 'fetchAgentFromDatabase').mockResolvedValue(null)
+    spyOn(databaseModule, 'startAgentRun').mockResolvedValue('run-1')
+    spyOn(databaseModule, 'finishAgentRun').mockResolvedValue(undefined)
+    spyOn(databaseModule, 'addAgentStep').mockResolvedValue('step-1')
+
+    spyOn(mcpClientModule, 'getMCPClient').mockResolvedValue('mcp-client-id') // placeholder client id
+    spyOn(mcpClientModule, 'listMCPTools').mockResolvedValue({ // the mocked server advertises three tools
+      tools: [
+        {
+          name: 'browser_navigate',
+          description: 'Navigate to a page',
+          inputSchema: { type: 'object', properties: {} },
+        },
+        {
+          name: 'browser_snapshot',
+          description: 'Capture snapshot',
+          inputSchema: { type: 'object', properties: {} },
+        },
+        {
+          name: 'browser_click', // not in TEST_AGENT.toolNames; expected to be dropped
+          description: 'Click an element',
+          inputSchema: { type: 'object', properties: {} },
+        },
+      ],
+    } as Awaited<ReturnType<typeof mcpClientModule.listMCPTools>>)
+
+    let filteredTools: Array<{ name: string }> = [] // filled inside the callMainPrompt stub, asserted after client.run resolves
+
+    spyOn(mainPromptModule, 'callMainPrompt').mockImplementation( // stub that only requests MCP tool data and then replies
+      async (params: Parameters<typeof mainPromptModule.callMainPrompt>[0]) => {
+        const { sendAction, promptId, requestMcpToolData } = params
+        const sessionState = getInitialSessionState(getStubProjectFileContext())
+
+        filteredTools = await requestMcpToolData({
+          mcpConfig: browserMcpConfig,
+          toolNames: TEST_AGENT.toolNames! // keep the 'browser/' entries and strip that prefix to get bare tool names
+            .filter((toolName) => toolName.startsWith('browser/'))
+            .map((toolName) => toolName.slice('browser/'.length)),
+        })
+
+        await sendAction({ // NOTE(review): presumably this prompt-response is what lets client.run resolve; confirm
+          action: {
+            type: 'prompt-response',
+            promptId,
+            sessionState,
+            output: {
+              type: 'lastMessage',
+              value: [],
+            },
+          },
+        })
+
+        return {
+          sessionState,
+          output: {
+            type: 'lastMessage' as const,
+            value: [],
+          },
+        }
+      },
+    )
+
+    const client = new CodebuffClient({
+      apiKey: 'test-key',
+      agentDefinitions: [TEST_AGENT],
+    })
+
+    const result = await client.run({
+      agent: TEST_AGENT.id,
+      prompt: 'List MCP tools',
+    })
+
+    expect(result.output.type).toBe('lastMessage')
+    expect(filteredTools.map((tool: { name: string }) => tool.name)).toEqual([ // browser_click was listed by the mock but must not appear
+      'browser_navigate',
+      'browser_snapshot',
+    ])
+  })
+})
diff --git a/sdk/src/run.ts b/sdk/src/run.ts
@@ -394,7 +394,7 @@ async function runOnce({
           filteredTools.push(tool)
           continue
         }
-        if (tool.name in toolNames) {
+        if (toolNames.includes(tool.name)) {
           filteredTools.push(tool)
           continue
         }

Original file line number	Diff line number	Diff line change
`@@ -394,7 +394,7 @@ async function runOnce({`
`394`	`394`	`filteredTools.push(tool)`
`395`	`395`	`continue`
`396`	`396`	`}`
`397`		`- if (tool.name in toolNames) {`
	`397`	`+ if (toolNames.includes(tool.name)) {`
`398`	`398`	`filteredTools.push(tool)`
`399`	`399`	`continue`
`400`	`400`	`}`