move format-specific adapters to examples/, purge format-specific MCP tools

2026-07-01 10:36:14 +02:00 · 2026-07-01 10:36:14 +02:00 · d7477344a6
commit d7477344a6
parent 25d844d1f9
3 changed files with 2 additions and 84 deletions
--- a/bex/mcp_server.py
+++ b/bex/mcp_server.py
@ -1,20 +1,14 @@
-"""Grammar Inference Engine — MCP server.
+"""Dervish — MCP server.
 Provides tools to infer regular expression grammars from example sequences.
 Run as: python -m bex.mcp_server
 """
 import json
 import sys
 from pathlib import Path
 from typing import Any
 from mcp.server.fastmcp import FastMCP
 from .crx import CRX
 from .idregex import idregex
 from .ensemble import infer_ensemble, _matches
 from .yaml_to_seq import yaml_file_to_sequence, sequences_to_crx
 mcp = FastMCP("grammar-inference", log_level="ERROR")
@ -54,8 +48,7 @@ def infer_best_grammar(
    N: int = 3,
 ) -> str:
    """Infer a compact grammar from example sequences. Use this when you
-    need to generate structured content (Ansible roles, CI configs, Helm
+    have examples of sequential data and want to learn the pattern.
    values, YAML configs, etc.) and have existing examples to learn from.
    The grammar compresses N examples into ~100 chars — far fewer tokens
    than passing all examples. Pass the existing sequences, get back a
@ -92,81 +85,6 @@ def infer_best_grammar(
    return "\n".join(lines)
@mcp.tool()
def infer_yaml_grammar(
    yaml_dir: str,
    pattern: str = "**/*.yml",
    method: str = "crx",
) -> str:
    """Infer a grammar from YAML files by converting them to key-path sequences.

    Every matching file is turned into one sequence via
    ``yaml_file_to_sequence``; the chosen algorithm then learns a single
    pattern covering all collected sequences.

    Args:
        yaml_dir: Root directory to search for YAML files.
        pattern: Glob pattern for YAML files (default: **/*.yml).
        method: Algorithm to use. 'crx' selects CRX; any other value
            falls through to idregex.

    Returns:
        A regular expression grammar describing the YAML structure, or a
        placeholder string when no sequences were found / nothing was
        inferred.
    """
    collected = []
    # Sort the matches so the sequences are always fed in the same order.
    for candidate in sorted(Path(yaml_dir).rglob(pattern)):
        if not candidate.is_file():
            continue
        try:
            key_paths = yaml_file_to_sequence(candidate)
            if key_paths:
                collected.append(key_paths)
        except Exception:
            # Best effort: a file that cannot be converted is skipped.
            continue

    if not collected:
        return "ε (no sequences found)"

    if method != "crx":
        # idregex may come back empty; report that as the empty language.
        return idregex(collected, kmax=2, N=3) or "∅"
    return CRX().infer(collected)
@mcp.tool()
def infer_ansible_role_grammar(roles_dir: str = ".") -> str:
    """Infer grammars from Ansible role task module sequences.

    Reads tasks/main.yml from each role, extracts the sequence of
    Ansible module names, groups roles by category prefix, and learns
    a per-category grammar. The collection and learning are delegated to
    ``collect_all_role_sequences`` and ``learn_grammar`` from the
    ``role_grammar`` module.

    Args:
        roles_dir: Path to the Ansible roles directory.

    Returns:
        A formatted report with per-category grammars and role listings,
        or a short message when the helper module is unavailable or no
        roles were found.
    """
    try:
        # Imported inside the function; a missing module is reported to the
        # caller as a message instead of raising.
        from .role_grammar import collect_all_role_sequences, learn_grammar
    except ImportError:
        return "role_grammar module not available"

    all_roles, by_category = collect_all_role_sequences(roles_dir)
    if not all_roles:
        return "No roles found."

    lines = [f"Found {len(all_roles)} roles in {len(by_category)} categories\n"]
    for cat in sorted(by_category):
        items = by_category[cat]  # (role name, module sequence) pairs
        lines.append(f"── {cat} ({len(items)} roles) ──")
        # A grammar is only learned when there is more than one role to
        # generalize over.
        if len(items) > 1:
            seqs = [s for _, s in items]
            lines.append(f"  Grammar: {learn_grammar(seqs)}")
        lines.append(f"  Roles: {', '.join(n for n, _ in items)}")
        lines.append("")
    return "\n".join(lines)
 def main():
    """Run the module-level FastMCP server instance (``mcp``)."""
    mcp.run()
--- a/examples/role_grammar.py
+++ b/examples/role_grammar.py
--- a/examples/yaml_to_seq.py
+++ b/examples/yaml_to_seq.py