refactor: filter_tools/GraphToolkit 최상위 export — LangChain 의존 없이 from graph_tool_call import filter_tools

SonAIengine · claude · SonAIengine · commit 08a860083584 · 2026-03-23T17:13:45.000+09:00
- toolkit.py를 graph_tool_call/ 최상위로 이동 (langchain 패키지 의존 제거)
- `from graph_tool_call import filter_tools, GraphToolkit` 가능
- 기존 `from graph_tool_call.langchain import ...` 경로도 호환 유지
- README: "Wrap Existing Tools" 독립 섹션 분리, LangChain 전용은 별도로

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
diff --git a/README.md b/README.md
@@ -489,54 +489,59 @@ from graph_tool_call.middleware import patch_anthropic
 patch_anthropic(client, graph=tg, top_k=5)
 ```
 
-### LangChain Integration
-
-```bash
-pip install graph-tool-call[langchain]
-```
+### Wrap Existing Tools (any format)
 
-**Wrap existing tools** — filter any tool list down to relevant ones:
+Already have a tool list? Wrap it with `filter_tools` — **no extra dependencies**, works with any format:
 
 ```python
-from graph_tool_call.langchain import filter_tools
+from graph_tool_call import filter_tools
 
-# Works with any tool format:
-# - LangChain BaseTool (@tool, StructuredTool, etc.)
-# - OpenAI function dicts ({"type": "function", "function": {...}})
-# - MCP tool dicts ({"name": ..., "inputSchema": ...})
-# - Python functions with type hints
+# Accepts any tool format:
+#   LangChain BaseTool, OpenAI function dicts, MCP tool dicts,
+#   Anthropic tool dicts, or plain Python functions
 
 filtered = filter_tools(all_tools, "send an email to John", top_k=5)
-
-agent = create_react_agent(llm, filtered)
-agent.invoke({"input": "send an email to John"})
+# → only the 5 most relevant tools, original objects preserved
 ```
 
 **Reusable toolkit** — build the graph once, filter per query:
 
 ```python
-from graph_tool_call.langchain import GraphToolkit
+from graph_tool_call import GraphToolkit
 
 toolkit = GraphToolkit(tools=all_tools, top_k=5)
 
-# Each call returns only relevant tools — original objects preserved
 tools_a = toolkit.get_tools("cancel my order")
 tools_b = toolkit.get_tools("check the weather")
 
 # Access the underlying ToolGraph for advanced config
 toolkit.graph.enable_embedding("ollama/qwen3-embedding:0.6b")
 ```
 
+### LangChain Integration
+
+```bash
+pip install graph-tool-call[langchain]
+```
+
+`filter_tools` / `GraphToolkit` work directly with LangChain agents:
+
+```python
+from graph_tool_call import filter_tools
+
+filtered = filter_tools(langchain_tools, "cancel order", top_k=5)
+agent = create_react_agent(llm, filtered)
+```
+
 <details>
-<summary>Retriever (returns Documents instead of tools)</summary>
+<summary>LangChain Retriever (returns Documents instead of tools)</summary>
 
 ```python
 from graph_tool_call import ToolGraph
 from graph_tool_call.langchain import GraphToolRetriever
 
 tg = ToolGraph.from_url("https://api.example.com/openapi.json")
 
-# Use as a LangChain retriever — compatible with any chain/agent
 retriever = GraphToolRetriever(tool_graph=tg, top_k=5)
 docs = retriever.invoke("cancel an order")
 
diff --git a/graph_tool_call/__init__.py b/graph_tool_call/__init__.py
@@ -8,6 +8,7 @@
     "CategorySummary",
     "DuplicatePair",
     "GraphAnalysisReport",
+    "GraphToolkit",
     "MCPAnnotations",
     "MergeStrategy",
     "NodeType",
@@ -20,6 +21,7 @@
     "ToolCallPolicy",
     "ToolGraph",
     "ToolSchema",
+    "filter_tools",
     "parse_tool",
 ]
 
@@ -36,6 +38,8 @@
     "ToolCallPolicy": ("graph_tool_call.assist.policy", "ToolCallPolicy"),
     "RetrievalResult": ("graph_tool_call.retrieval.engine", "RetrievalResult"),
     "SearchMode": ("graph_tool_call.retrieval.engine", "SearchMode"),
+    "filter_tools": ("graph_tool_call.toolkit", "filter_tools"),
+    "GraphToolkit": ("graph_tool_call.toolkit", "GraphToolkit"),
 }
 
 
diff --git a/graph_tool_call/langchain/__init__.py b/graph_tool_call/langchain/__init__.py
@@ -10,8 +10,8 @@
 
 _LAZY_IMPORTS: dict[str, tuple[str, str]] = {
     "GraphToolRetriever": ("graph_tool_call.langchain.retriever", "GraphToolRetriever"),
-    "GraphToolkit": ("graph_tool_call.langchain.toolkit", "GraphToolkit"),
-    "filter_tools": ("graph_tool_call.langchain.toolkit", "filter_tools"),
+    "GraphToolkit": ("graph_tool_call.toolkit", "GraphToolkit"),
+    "filter_tools": ("graph_tool_call.toolkit", "filter_tools"),
     "langchain_tools_to_schemas": ("graph_tool_call.langchain.tools", "langchain_tools_to_schemas"),
     "tool_schema_to_openai_function": (
         "graph_tool_call.langchain.tools",
diff --git a/graph_tool_call/toolkit.py b/graph_tool_call/toolkit.py
@@ -0,0 +1,206 @@
+"""Toolkit: wrap existing tools with graph-based filtering.
+
+Provides :func:`filter_tools` for one-shot filtering and
+:class:`GraphToolkit` for reusable tool management with retrieval.
+
+Accepts any tool format:
+- LangChain ``BaseTool`` (``@tool``, ``StructuredTool``, etc.)
+- OpenAI function dict (``{"type": "function", "function": {"name": ...}}``)
+- Anthropic tool dict (``{"name": ..., "input_schema": ...}``)
+- MCP tool dict (``{"name": ..., "inputSchema": ...}``)
+- Python callable with type hints
+
+Usage::
+
+    from graph_tool_call import filter_tools, GraphToolkit
+
+    # One-shot: filter tools by query
+    filtered = filter_tools(all_tools, "cancel order", top_k=5)
+
+    # Reusable: wrap once, filter many times
+    toolkit = GraphToolkit(tools=all_tools, top_k=5)
+    filtered = toolkit.get_tools("cancel order")
+"""
+
+from __future__ import annotations
+
+import logging
+from typing import Any
+
+logger = logging.getLogger("graph-tool-call.langchain")
+
+
+def _extract_name(tool: Any) -> str:
+    """Extract tool name from any supported format."""
+    # Object with .name attribute (LangChain BaseTool, ToolSchema, etc.)
+    if hasattr(tool, "name"):
+        return tool.name
+
+    # Dict formats
+    if isinstance(tool, dict):
+        # OpenAI: {"type": "function", "function": {"name": ...}}
+        if "function" in tool:
+            return tool["function"].get("name", "")
+        # MCP / Anthropic: {"name": ...}
+        if "name" in tool:
+            return tool["name"]
+
+    # Callable (Python function)
+    if callable(tool):
+        return getattr(tool, "__name__", "")
+
+    return ""
+
+
+def _ingest_tools(graph: Any, tools: list[Any]) -> None:
+    """Ingest tools into a ToolGraph, auto-detecting format."""
+    from graph_tool_call.core.tool import parse_tool
+
+    callables = []
+    for tool in tools:
+        if callable(tool) and not hasattr(tool, "name") and not isinstance(tool, dict):
+            callables.append(tool)
+        else:
+            graph.add_tool(parse_tool(tool))
+
+    if callables:
+        graph.ingest_functions(callables)
+
+
+def filter_tools(
+    tools: list[Any],
+    query: str,
+    *,
+    top_k: int = 5,
+    graph: Any | None = None,
+) -> list[Any]:
+    """Filter tools by relevance to *query*.
+
+    Parameters
+    ----------
+    tools:
+        List of tools in any format — LangChain ``BaseTool``, OpenAI function
+        dicts, MCP tool dicts, Anthropic tool dicts, or Python callables.
+    query:
+        Natural-language query to match tools against.
+    top_k:
+        Maximum number of tools to return (default: 5).
+    graph:
+        Optional pre-built ``ToolGraph``. If *None*, a temporary graph is
+        built from *tools* on the fly.
+
+    Returns
+    -------
+    list
+        Subset of *tools* ranked by relevance. Original tool objects are
+        preserved (not copies), so they remain callable by the agent.
+    """
+    from graph_tool_call import ToolGraph
+
+    if graph is None:
+        graph = ToolGraph()
+
+    # Index by name for fast lookup
+    tool_map: dict[str, Any] = {}
+    for t in tools:
+        name = _extract_name(t)
+        if name:
+            tool_map[name] = t
+
+    # Ingest only if the graph holds none of these tools yet (any overlap skips ingestion)
+    existing = set(graph.tools.keys())
+    if not existing.intersection(tool_map.keys()):
+        _ingest_tools(graph, tools)
+
+    results = graph.retrieve(query, top_k=top_k)
+    result_names = [r.name for r in results]
+
+    filtered = [tool_map[name] for name in result_names if name in tool_map]
+
+    if filtered:
+        logger.debug(
+            "Filtered %d → %d tools for query: %s",
+            len(tools),
+            len(filtered),
+            query[:50],
+        )
+        return filtered
+
+    logger.debug("Retrieval returned no matches, returning all %d tools", len(tools))
+    return list(tools)
+
+
+class GraphToolkit:
+    """Wraps a list of tools with graph-based retrieval.
+
+    Build once from existing tools, then call :meth:`get_tools` per query.
+
+    Parameters
+    ----------
+    tools:
+        List of tools in any format — LangChain ``BaseTool``, OpenAI function
+        dicts, MCP tool dicts, Anthropic tool dicts, or Python callables.
+    top_k:
+        Default number of tools to return per query.
+    graph:
+        Optional pre-built ``ToolGraph``. If *None*, one is built from *tools*.
+    """
+
+    def __init__(
+        self,
+        tools: list[Any],
+        *,
+        top_k: int = 5,
+        graph: Any | None = None,
+    ) -> None:
+        from graph_tool_call import ToolGraph
+
+        self._tools: dict[str, Any] = {}
+        for t in tools:
+            name = _extract_name(t)
+            if name:
+                self._tools[name] = t
+
+        self._top_k = top_k
+
+        if graph is not None:
+            self._graph: ToolGraph = graph
+        else:
+            self._graph = ToolGraph()
+
+        # Ingest only if the graph holds none of these tools yet (any overlap skips ingestion)
+        existing = set(self._graph.tools.keys())
+        if not existing.intersection(self._tools.keys()):
+            _ingest_tools(self._graph, tools)
+
+    @property
+    def graph(self) -> Any:
+        """Underlying ``ToolGraph`` instance."""
+        return self._graph
+
+    @property
+    def all_tools(self) -> list[Any]:
+        """All registered tools."""
+        return list(self._tools.values())
+
+    def get_tools(self, query: str, *, top_k: int | None = None) -> list[Any]:
+        """Return tools relevant to *query*.
+
+        Parameters
+        ----------
+        query:
+            Natural-language query.
+        top_k:
+            Override the default top_k for this call.
+
+        Returns
+        -------
+        list
+            Filtered tools, ordered by relevance. Original objects preserved.
+        """
+        k = top_k if top_k is not None else self._top_k
+        results = self._graph.retrieve(query, top_k=k)
+        result_names = [r.name for r in results]
+
+        filtered = [self._tools[name] for name in result_names if name in self._tools]
+        return filtered if filtered else self.all_tools
diff --git a/tests/test_langchain_toolkit.py b/tests/test_langchain_toolkit.py