"""V2 agent tools — compound tools that chain multiple primitives.
The v1 tools (``agent_tools.py``) are atomic: one tool = one operation.
The agent has to orchestrate them across multiple turns. This works but
is expensive — a complex query like "인권경영과 예산 편성의 관계" takes
6-10 turns because the agent has to:
search → list_categories → search(cat) → get_doc → search(cat2) → get_doc2
The v2 tools solve this by **chaining internally**:
- ``deep_search``: search → auto-expand top hits → read relevant chunks
→ return a comprehensive result in ONE turn.
- ``compare``: decompose a multi-entity query → parallel search each →
merge results.
These compound tools call the v1 primitives internally via
``asyncio.gather`` for parallelism. The agent sees them as single tools
that return richer results.
Typical turn reduction: 6-10 turns → 1-3 turns.
"""

from __future__ import annotations

import asyncio
import logging
import re
from typing import TYPE_CHECKING

from synaptic.agent_tools import (
    Hint,
    ToolResult,
    _budget_check,
    expand_tool,
    get_document_tool,
    search_tool,
)
from synaptic.search_session import SearchSession

if TYPE_CHECKING:
    from synaptic.protocols import StorageBackend

logger = logging.getLogger("agent-tools-v2")


async def deep_search_tool(
    backend: StorageBackend,
    session: SearchSession,
    query: str,
    *,
    limit: int = 5,
    category: str | None = None,
    read_top_k: int = 2,
    embedder: object | None = None,
    reranker: object | None = None,
) -> ToolResult:
    """One-turn deep search: search → expand → read documents.

    Chains three v1 primitives internally:

    1. ``search`` with the query (+ optional category filter)
    2. ``expand`` the top hit to discover neighbours
    3. ``get_document`` on the top-k results with query-aware chunking

    Returns a single consolidated result: evidence list + expanded
    neighbours + document excerpts, all in one turn instead of 3-5.

    Args:
        backend: Storage backend.
        session: Active search session.
        query: User query.
        limit: Max evidence items from the initial search.
        category: Optional category filter.
        read_top_k: How many top documents to read in full.
        embedder: Optional embedder for EvidenceSearch.
        reranker: Optional cross-encoder reranker (accepted but not yet
            used by this tool).
    """
    budget = _budget_check(session, "deep_search")
    if budget is not None:
        return budget

    session.record_query(query)

    # Step 1: search
    search_result = await search_tool(
        backend,
        session,
        query,
        limit=limit,
        category=category,
        embedder=embedder,
    )
    evidence = search_result.data.get("evidence", [])

    # Step 2: expand top hit (parallel with step 3)
    expanded_neighbours: list[dict] = []
    doc_excerpts: list[dict] = []
    if evidence:
        top_node_id = evidence[0].get("id", "")
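        # dict.fromkeys deduplicates document ids while preserving
        # first-seen order, so documents are read in relevance order.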
        top_doc_ids = list(
            dict.fromkeys(e.get("document_id", "") for e in evidence if e.get("document_id"))
        )[:read_top_k]

        # Parallel: expand + get_documents
        tasks = []
        # Expand top hit
        if top_node_id:
            tasks.append(_safe_expand(backend, session, top_node_id))
        # Read top documents
        for doc_id in top_doc_ids:
            tasks.append(_safe_get_doc(backend, session, doc_id, query))

        results = await asyncio.gather(*tasks)
        for r in results:
            if r is None:
                continue
            if r.tool == "expand" and r.ok:
                expanded_neighbours = r.data.get("neighbours", [])
            elif r.tool == "get_document" and r.ok:
                doc_excerpts.append(
                    {
                        "document": r.data.get("document", {}),
                        "relevant_chunks": [
                            c for c in r.data.get("chunks", []) if c.get("relevant")
                        ],
                        "total_chunks": r.data.get("chunk_count", 0),
                    }
                )

    # Build consolidated response
    hints: list[Hint] = []
    if not evidence:
        # No hits: suggest a plain-FTS retry on the first content word.
        # The prior hint passed "try a different category" as a literal
        # argument; the LLM copied it verbatim and failed. Executable
        # hints work, meta-hints don't.
        tokens = [t for t in query.split() if len(t) >= 2]
        if tokens:
            hints.append(
                Hint(
                    action="search",
                    args={"query": tokens[0]},
                    reason=(
                        "deep_search found nothing — retry plain FTS on the "
                        "first keyword alone; often the full question phrase "
                        "over-constrains BM25"
                    ),
                )
            )
        hints.append(
            Hint(
                action="list_categories",
                args={},
                reason="inspect available categories, then retry deep_search with category= filter",
            )
        )

    return ToolResult(
        tool="deep_search",
        ok=True,
        data={
            "evidence": evidence,
            "expanded_neighbours": expanded_neighbours[:5],
            "document_excerpts": doc_excerpts,
            "search_anchors": search_result.data.get("anchors", {}),
        },
        hints=hints,
        session=session.summary(),
    )
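

# A minimal usage sketch (illustrative only, not part of the v2 API): how
# an agent loop might consume the consolidated deep_search payload in a
# single turn. `backend`, `session`, and `embedder` are assumed to be
# constructed elsewhere; `_example_deep_search` and the query string are
# hypothetical names, not exported by this module.
async def _example_deep_search(
    backend: StorageBackend,
    session: SearchSession,
    embedder: object | None = None,
) -> None:
    result = await deep_search_tool(
        backend,
        session,
        "인권경영 보고서",  # hypothetical query: "human-rights management report"
        limit=5,
        read_top_k=2,
        embedder=embedder,
    )
    # One turn yields evidence, graph neighbours, and document excerpts.
    for item in result.data["evidence"]:
        print(item.get("id"), item.get("document_id"))
    for excerpt in result.data["document_excerpts"]:
        print(len(excerpt["relevant_chunks"]), "of", excerpt["total_chunks"], "chunks")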


async def compare_search_tool(
    backend: StorageBackend,
    session: SearchSession,
    query: str,
    *,
    embedder: object | None = None,
) -> ToolResult:
    """Decompose a multi-topic query and search each part in parallel.

    Splits queries on the Korean conjunctions "과", "와", "및", and
    "그리고" into sub-queries, searches each one, and merges the
    results. Solves cross-document queries in 1 turn instead of 4-6.

    Example:
        "인권경영과 예산 편성의 관계"
        → sub1: search("인권경영")
        → sub2: search("예산 편성")
        → merge: both result sets with cross-references
    """
    budget = _budget_check(session, "compare_search")
    if budget is not None:
        return budget

    session.record_query(query)

    # Decompose query
    sub_queries = _decompose_query(query)
    if len(sub_queries) <= 1:
        # Not decomposable; fall back to a regular deep_search
        return await deep_search_tool(backend, session, query, embedder=embedder)

    # Parallel search for each sub-query
    tasks = [search_tool(backend, session, sq, limit=5, embedder=embedder) for sq in sub_queries]
    results = await asyncio.gather(*tasks)

    # Merge results
    all_evidence: list[dict] = []
    sub_results: list[dict] = []
    for sq, r in zip(sub_queries, results):
        evidence = r.data.get("evidence", []) if r.ok else []
        sub_results.append(
            {
                "sub_query": sq,
                "evidence_count": len(evidence),
                "top_result": evidence[0] if evidence else None,
            }
        )
        all_evidence.extend(evidence)

    # Deduplicate by node id
    seen_ids: set[str] = set()
    unique_evidence: list[dict] = []
    for e in all_evidence:
        eid = e.get("id", "")
        if eid not in seen_ids:
            seen_ids.add(eid)
            unique_evidence.append(e)

    return ToolResult(
        tool="compare_search",
        ok=True,
        data={
            "original_query": query,
            "sub_queries": sub_results,
            "merged_evidence": unique_evidence[:10],
        },
        hints=[],
        session=session.summary(),
    )
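

# A companion sketch for compare_search (illustrative only, hypothetical
# name): the compound query below decomposes into two sub-queries that are
# searched in parallel and merged. Objects are assumed to exist as in the
# deep_search example above.
async def _example_compare_search(
    backend: StorageBackend,
    session: SearchSession,
) -> None:
    # Query: "the relationship between human-rights management and budgeting"
    result = await compare_search_tool(backend, session, "인권경영과 예산 편성의 관계")
    for sub in result.data["sub_queries"]:
        print(sub["sub_query"], sub["evidence_count"])
    print(len(result.data["merged_evidence"]))  # deduplicated, capped at 10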


# --- Helpers ---


def _decompose_query(query: str) -> list[str]:
    """Split a compound query into sub-queries on Korean conjunctions.

    "인권경영과 예산 편성의 관계" → ["인권경영", "예산 편성"]
        ("the relationship between human-rights management and budgeting")
    "승마 행사 및 대회 계획" → ["승마 행사", "대회 계획"]
        ("equestrian events and competition plans")

    Returns the original query as a single-element list if no
    conjunction is found; the caller treats it as non-decomposable.
    """
    # Korean conjunctions that signal multi-topic queries
    # (과/와 attach to the preceding noun; 및/그리고 stand alone — all mean "and")
    parts = re.split(r"(?:과|와|및|그리고)\s+", query)

    # Strip trailing particles such as "의 관계" ("relationship of") or
    # "에 대해" ("about") left on each fragment after the split
    cleaned = []
    for p in parts:
        p = re.sub(
            r"(의\s+관계|의\s+연관|에\s+대해|에\s+미치는|을\s+비교|를\s+비교)$", "", p
        ).strip()
        if len(p) >= 2:
            cleaned.append(p)

    if len(cleaned) < 2:
        return [query]
    return cleaned
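

# Stage-by-stage sanity check for _decompose_query (a sketch; the values
# shown follow from the regexes above):
#
#     re.split(...) on "인권경영과 예산 편성의 관계"
#         → ["인권경영", "예산 편성의 관계"]   (split at "과 ")
#     particle cleanup
#         → ["인권경영", "예산 편성"]          ("의 관계" stripped)
#
#     _decompose_query("단일 주제 질의")        # no conjunction present
#         → ["단일 주제 질의"]                  (non-decomposable)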


async def _safe_expand(
    backend: StorageBackend,
    session: SearchSession,
    node_id: str,
) -> ToolResult | None:
    """Expand with error swallowing."""
    try:
        return await expand_tool(backend, session, node_id, limit=5)
    except Exception:
        logger.debug("expand failed for node %s", node_id, exc_info=True)
        return None


async def _safe_get_doc(
    backend: StorageBackend,
    session: SearchSession,
    doc_id: str,
    query: str,
) -> ToolResult | None:
    """Get document with error swallowing."""
    try:
        return await get_document_tool(
            backend,
            session,
            doc_id,
            query=query,
            max_full_chunks=3,
        )
    except Exception:
        logger.debug("get_document failed for doc %s", doc_id, exc_info=True)
        return None