UltrafastSecp256k1/scripts/query_graph.py

#!/usr/bin/env python3
"""
query_graph.py  --  Query the UltrafastSecp256k1 Project Knowledge Graph

Lightweight CLI for AI agents and developers to query the SQLite project graph.

Usage Examples:
    python3 scripts/query_graph.py search "schnorr sign"
    python3 scripts/query_graph.py file cpu/src/ecdsa.cpp
    python3 scripts/query_graph.py subsystem ecdsa
    python3 scripts/query_graph.py deps cpu/src/musig2.cpp
    python3 scripts/query_graph.py rdeps secp256k1/schnorr.hpp
    python3 scripts/query_graph.py abi ecdsa
    python3 scripts/query_graph.py test ethereum
    python3 scripts/query_graph.py layer ct
    python3 scripts/query_graph.py function ufsecp_ecdsa_sign
    python3 scripts/query_graph.py audit protocol
    python3 scripts/query_graph.py platform x86_64
    python3 scripts/query_graph.py methods FieldElement
    python3 scripts/query_graph.py security ct_sign.cpp
    python3 scripts/query_graph.py routing ecdsa_sign
    python3 scripts/query_graph.py bindings rust
    python3 scripts/query_graph.py macros size_constant
    python3 scripts/query_graph.py impact cpu/src/ct_sign.cpp
    python3 scripts/query_graph.py context cpu/src/ecdsa.cpp
    python3 scripts/query_graph.py gaps
    python3 scripts/query_graph.py summary
    python3 scripts/query_graph.py sql "SELECT * FROM error_codes"
    python3 scripts/query_graph.py callgraph ecdsa_sign
    python3 scripts/query_graph.py hotspots 10
    python3 scripts/query_graph.py dead
    python3 scripts/query_graph.py aliases ecdsa_sign
    python3 scripts/query_graph.py coverage field_mul
    python3 scripts/query_graph.py config cmake_option
"""

import sqlite3
import sys
import json
from pathlib import Path

SCRIPT_DIR = Path(__file__).resolve().parent
LIB_ROOT = SCRIPT_DIR.parent
DB_PATH = LIB_ROOT / ".project_graph.db"

def get_conn():
    if not DB_PATH.exists():
        print(f"ERROR: Database not found at {DB_PATH}")
        print(f"Run: python3 {SCRIPT_DIR}/build_project_graph.py")
        sys.exit(1)
    conn = sqlite3.connect(str(DB_PATH))
    conn.row_factory = sqlite3.Row
    return conn

def cmd_search(query: str):
    """Full-text search across files, functions, docs, methods, and routing."""
    conn = get_conn()
    # Convert space-separated words to OR for FTS5
    fts_query = ' OR '.join(query.split())
    print(f"=== Search: {query} ===\n")

    # Files
    rows = conn.execute("SELECT path, category, subsystem, layer FROM fts_files WHERE fts_files MATCH ?", (fts_query,)).fetchall()
    if rows:
        print(f"FILES ({len(rows)}):")
        for r in rows:
            print(f"  [{r['layer'] or '?':4s}] {r['path']}  ({r['category']}, {r['subsystem'] or '-'})")

    # Functions
    rows = conn.execute("SELECT name, category, layer, signature FROM fts_functions WHERE fts_functions MATCH ?", (fts_query,)).fetchall()
    if rows:
        print(f"\nC ABI FUNCTIONS ({len(rows)}):")
        for r in rows:
            print(f"  [{r['layer']:4s}] {r['name']}  ({r['category']})")

    # C++ Methods
    try:
        rows = conn.execute("SELECT class_name, method, signature, layer FROM fts_methods WHERE fts_methods MATCH ?", (fts_query,)).fetchall()
        if rows:
            print(f"\nC++ METHODS ({len(rows)}):")
            for r in rows:
                cls = r['class_name'] or '(free)'
                print(f"  [{r['layer']:4s}] {cls}::{r['method']}")
    except Exception:
        pass

    # ABI Routing
    try:
        rows = conn.execute("SELECT abi_function, internal_call, layer FROM fts_routing WHERE fts_routing MATCH ?", (fts_query,)).fetchall()
        if rows:
            print(f"\nABI ROUTING ({len(rows)}):")
            for r in rows:
                print(f"  [{r['layer']:4s}] {r['abi_function']} -> {r['internal_call']}")
    except Exception:
        pass

    # Docs
    rows = conn.execute("SELECT path, title, category FROM fts_docs WHERE fts_docs MATCH ?", (fts_query,)).fetchall()
    if rows:
        print(f"\nDOCS ({len(rows)}):")
        for r in rows:
            print(f"  {r['path']}  ({r['category']})")

    # Semantic tags
    rows = conn.execute("""SELECT entity_type, entity_id, tag, domain
                           FROM fts_tags WHERE fts_tags MATCH ?
                           LIMIT 20""", (fts_query,)).fetchall()
    if rows:
        print(f"\nSEMANTIC TAGS ({len(rows)}):")
        for r in rows:
            print(f"  [{r['entity_type']}] {r['entity_id']}  ->  {r['tag']} ({r['domain']})")

    conn.close()

def cmd_file(path: str):
    """Show everything known about a file."""
    conn = get_conn()
    r = conn.execute("SELECT * FROM source_files WHERE path LIKE ?", (f'%{path}%',)).fetchone()
    if not r:
        print(f"File not found: {path}")
        return

    print(f"FILE: {r['path']}")
    print(f"  Category:  {r['category']}")
    print(f"  Subsystem: {r['subsystem'] or '-'}")
    print(f"  Layer:     {r['layer']}")
    print(f"  Lines:     {r['lines']}")
    print(f"  Type:      {r['file_type']}")

    # Dependencies
    deps = conn.execute("SELECT included_file FROM include_deps WHERE source_file=?", (r['path'],)).fetchall()
    if deps:
        print(f"\n  INCLUDES ({len(deps)}):")
        for d in deps:
            print(f"    {d['included_file']}")

    # Reverse deps
    rdeps = conn.execute("SELECT source_file FROM include_deps WHERE included_file LIKE ?", (f'%{Path(r["path"]).name}%',)).fetchall()
    if rdeps:
        print(f"\n  INCLUDED BY ({len(rdeps)}):")
        for d in rdeps:
            print(f"    {d['source_file']}")

    # Tests covering this file
    tests = conn.execute("""SELECT src_id FROM edges
        WHERE dst_type='source_file' AND dst_id=? AND relation='covers'""", (r['path'],)).fetchall()
    if tests:
        print(f"\n  TESTED BY ({len(tests)}):")
        for t in tests:
            print(f"    {t['src_id']}")

    # ABI functions implementing through this file
    funcs = conn.execute("""SELECT src_id FROM edges
        WHERE dst_type='source_file' AND dst_id=? AND relation='implements'""", (r['path'],)).fetchall()
    if funcs:
        print(f"\n  ABI FUNCTIONS ({len(funcs)}):")
        for f in funcs:
            print(f"    {f['src_id']}")

    conn.close()

def cmd_subsystem(name: str):
    """List all files and functions in a subsystem."""
    conn = get_conn()
    rows = conn.execute("SELECT path, category, layer, lines FROM source_files WHERE subsystem=? ORDER BY lines DESC", (name,)).fetchall()
    print(f"=== Subsystem: {name} ({len(rows)} files) ===\n")
    total_lines = 0
    for r in rows:
        print(f"  [{r['layer']:4s}] {r['path']:60s} {r['lines']:5d} lines")
        total_lines += r['lines']
    print(f"\n  Total: {total_lines} lines")

    funcs = conn.execute("SELECT name, layer FROM c_abi_functions WHERE category=?", (name,)).fetchall()
    if funcs:
        print(f"\n  C ABI FUNCTIONS ({len(funcs)}):")
        for f in funcs:
            print(f"    [{f['layer']:4s}] {f['name']}")
    conn.close()

def cmd_deps(path: str):
    """Show include dependencies for a source file."""
    conn = get_conn()
    rows = conn.execute("SELECT included_file, is_local FROM include_deps WHERE source_file LIKE ? ORDER BY is_local DESC, included_file",
                        (f'%{path}%',)).fetchall()
    print(f"=== Dependencies of {path} ({len(rows)}) ===\n")
    for r in rows:
        kind = 'local' if r['is_local'] else 'system'
        print(f"  [{kind:6s}] {r['included_file']}")
    conn.close()

def cmd_rdeps(header: str):
    """Show reverse dependencies (who includes this header)."""
    conn = get_conn()
    rows = conn.execute("SELECT source_file FROM include_deps WHERE included_file LIKE ? ORDER BY source_file",
                        (f'%{header}%',)).fetchall()
    print(f"=== Reverse deps of {header} ({len(rows)} files include it) ===\n")
    for r in rows:
        print(f"  {r['source_file']}")
    conn.close()

def cmd_abi(category: str = None):
    """List C ABI functions, optionally filtered by category."""
    conn = get_conn()
    if category:
        rows = conn.execute("SELECT name, category, layer, line_no FROM c_abi_functions WHERE category=? ORDER BY line_no", (category,)).fetchall()
    else:
        rows = conn.execute("SELECT name, category, layer, line_no FROM c_abi_functions ORDER BY category, line_no").fetchall()
    print(f"=== C ABI Functions ({len(rows)}) ===\n")
    for r in rows:
        print(f"  [{r['layer']:4s}] {r['name']:50s} ({r['category']}, L{r['line_no']})")
    conn.close()

def cmd_test(filter_str: str = None):
    """List test targets, optionally filtered."""
    conn = get_conn()
    if filter_str:
        rows = conn.execute("""SELECT name, category, timeout, labels FROM test_targets
            WHERE name LIKE ? OR category LIKE ? OR labels LIKE ? ORDER BY name""",
            (f'%{filter_str}%', f'%{filter_str}%', f'%{filter_str}%')).fetchall()
    else:
        rows = conn.execute("SELECT name, category, timeout, labels FROM test_targets ORDER BY category, name").fetchall()
    print(f"=== Test Targets ({len(rows)}) ===\n")
    for r in rows:
        print(f"  {r['name']:40s} [{r['category']:20s}] timeout={r['timeout']}s  {r['labels']}")
    conn.close()

def cmd_layer(layer: str):
    """List all files in a specific layer."""
    conn = get_conn()
    rows = conn.execute("SELECT path, category, subsystem, lines FROM source_files WHERE layer=? ORDER BY lines DESC",
                        (layer,)).fetchall()
    total = sum(r['lines'] for r in rows)
    print(f"=== Layer: {layer} ({len(rows)} files, {total} lines) ===\n")
    for r in rows[:30]:
        print(f"  {r['path']:60s} {r['lines']:5d}  ({r['category']}, {r['subsystem'] or '-'})")
    if len(rows) > 30:
        print(f"  ... and {len(rows) - 30} more files")
    conn.close()

def cmd_function(name: str):
    """Show details of a specific C ABI function."""
    conn = get_conn()
    r = conn.execute("SELECT * FROM c_abi_functions WHERE name LIKE ?", (f'%{name}%',)).fetchone()
    if not r:
        print(f"Function not found: {name}")
        return
    print(f"FUNCTION: {r['name']}")
    print(f"  Category:  {r['category']}")
    print(f"  Layer:     {r['layer']}")
    print(f"  Line:      {r['line_no']}")
    print(f"  Signature: {r['signature']}")

    # Implementation file
    impl = conn.execute("""SELECT dst_id FROM edges
        WHERE src_type='c_abi_function' AND src_id=? AND relation='implements'""", (r['name'],)).fetchone()
    if impl:
        print(f"  Impl:      {impl['dst_id']}")
    conn.close()

def cmd_audit(section: str = None):
    """List audit modules, optionally filtered by section."""
    conn = get_conn()
    if section:
        rows = conn.execute("SELECT * FROM audit_modules WHERE section LIKE ? ORDER BY section_no, module_id",
                            (f'%{section}%',)).fetchall()
    else:
        rows = conn.execute("SELECT * FROM audit_modules ORDER BY section_no, module_id").fetchall()
    print(f"=== Audit Modules ({len(rows)}) ===\n")
    cur_section = None
    for r in rows:
        if r['section'] != cur_section:
            cur_section = r['section']
            print(f"\n  [{r['section_no']}] {cur_section.upper()}:")
        print(f"    {r['module_id']:25s} {r['name']}")
    conn.close()

def cmd_platform(platform: str):
    """Show platform-specific dispatch info."""
    conn = get_conn()
    rows = conn.execute("SELECT * FROM platform_dispatch WHERE platform LIKE ? ORDER BY source_file",
                        (f'%{platform}%',)).fetchall()
    print(f"=== Platform: {platform} ({len(rows)} dispatch points) ===\n")
    for r in rows:
        print(f"  {r['source_file']:40s} [{r['mechanism']:12s}] {r['description']}")
    conn.close()

def cmd_summary():
    """Show database summary statistics."""
    conn = get_conn()
    stats = json.loads(conn.execute("SELECT value FROM meta WHERE key='stats'").fetchone()['value'])
    built = conn.execute("SELECT value FROM meta WHERE key='built_at'").fetchone()['value']
    version = conn.execute("SELECT value FROM meta WHERE key='version'").fetchone()['value']

    print(f"=== Project Knowledge Graph v{version} ===")
    print(f"  Built: {built}")
    print(f"  Database: {DB_PATH} ({DB_PATH.stat().st_size / 1024:.0f} KB)\n")

    total = sum(stats.values())
    print(f"TABLES ({total} total records):")
    for table, count in sorted(stats.items()):
        print(f"  {table:25s} {count:5d}")

    print(f"\nLAYER SUMMARY:")
    for r in conn.execute("SELECT * FROM v_layer_summary").fetchall():
        print(f"  {r['layer']:5s} {r['file_count']:4d} files  {r['total_lines']:6d} lines")

    print(f"\nTOP 10 SUBSYSTEMS:")
    for r in conn.execute("SELECT * FROM v_subsystem_files LIMIT 10").fetchall():
        print(f"  {r['subsystem']:15s} {r['file_count']:3d} files  {r['total_lines']:6d} lines")
    conn.close()

def cmd_sql(query: str):
    """Execute raw SQL query."""
    conn = get_conn()
    try:
        rows = conn.execute(query).fetchall()
        if rows:
            # Print header
            cols = rows[0].keys()
            print('|'.join(cols))
            print('-' * 80)
            for r in rows:
                print('|'.join(str(r[c]) for c in cols))
        else:
            print("(no results)")
    except Exception as e:
        print(f"SQL ERROR: {e}")
    conn.close()

def cmd_methods(class_name: str = None):
    """List C++ methods, optionally filtered by class."""
    conn = get_conn()
    if class_name:
        rows = conn.execute("""SELECT class_name, method, signature, layer, header_path, line_no
            FROM cpp_methods WHERE class_name LIKE ? OR method LIKE ?
            ORDER BY class_name, line_no""",
            (f'%{class_name}%', f'%{class_name}%')).fetchall()
    else:
        rows = conn.execute("""SELECT class_name, method, signature, layer, header_path, line_no
            FROM cpp_methods ORDER BY class_name, line_no""").fetchall()
    print(f"=== C++ Methods ({len(rows)}) ===\n")
    cur_cls = None
    for r in rows:
        cls = r['class_name'] or '(free)'
        if cls != cur_cls:
            cur_cls = cls
            print(f"\n  {cur_cls}:")
        print(f"    [{r['layer']:4s}] {r['method']:30s} {r['signature']}")
    conn.close()

def cmd_security(file_filter: str = None):
    """Show security-critical patterns (secure_erase, value_barrier, CLASSIFY)."""
    conn = get_conn()
    if file_filter:
        rows = conn.execute("""SELECT pattern, source_file, line_no, context
            FROM security_patterns WHERE source_file LIKE ?
            ORDER BY source_file, line_no""",
            (f'%{file_filter}%',)).fetchall()
    else:
        rows = conn.execute("""SELECT source_file, pattern, COUNT(*) as cnt,
            GROUP_CONCAT(line_no) as lines
            FROM security_patterns GROUP BY source_file, pattern
            ORDER BY source_file""").fetchall()
    if file_filter:
        print(f"=== Security Patterns in *{file_filter}* ({len(rows)}) ===\n")
        for r in rows:
            print(f"  L{r['line_no']:4d} [{r['pattern']:15s}] {r['context'][:80]}")
    else:
        print(f"=== Security Pattern Hotspots ({len(rows)} file-pattern groups) ===\n")
        cur_file = None
        for r in rows:
            if r['source_file'] != cur_file:
                cur_file = r['source_file']
                print(f"\n  {cur_file}:")
            print(f"    {r['pattern']:15s} x{r['cnt']:2d}  lines: {r['lines']}")
    conn.close()

def cmd_routing(fn_filter: str = None):
    """Show ABI routing: which ufsecp_* maps to CT vs fast."""
    conn = get_conn()
    if fn_filter:
        rows = conn.execute("""SELECT abi_function, internal_call, layer, impl_line
            FROM abi_routing WHERE abi_function LIKE ? OR internal_call LIKE ?
            ORDER BY impl_line""",
            (f'%{fn_filter}%', f'%{fn_filter}%')).fetchall()
    else:
        rows = conn.execute("""SELECT abi_function, internal_call, layer, impl_line
            FROM abi_routing ORDER BY impl_line""").fetchall()
    print(f"=== ABI Routing ({len(rows)}) ===\n")
    for r in rows:
        line_str = f"L{r['impl_line']}" if r['impl_line'] else '   ?'
        print(f"  [{r['layer']:4s}] {r['abi_function']:45s} -> {r['internal_call']:35s} ({line_str})")
    conn.close()

def cmd_bindings(lang: str = None):
    """Show binding language info."""
    conn = get_conn()
    if lang:
        rows = conn.execute("SELECT * FROM binding_languages WHERE language LIKE ?",
            (f'%{lang}%',)).fetchall()
    else:
        rows = conn.execute("SELECT * FROM binding_languages ORDER BY status, language").fetchall()
    print(f"=== Binding Languages ({len(rows)}) ===\n")
    for r in rows:
        print(f"  {r['language']:15s} [{r['status']:12s}] {r['directory']:30s} {r['file_count']:3d} files  FFI: {r['ffi_method']:12s} pkg: {r['package_name']}")
    conn.close()

def cmd_macros(category: str = None):
    """Show compile-time macros and defines."""
    conn = get_conn()
    if category:
        rows = conn.execute("SELECT * FROM macros WHERE category LIKE ? ORDER BY name",
            (f'%{category}%',)).fetchall()
    else:
        rows = conn.execute("SELECT * FROM macros ORDER BY category, name").fetchall()
    print(f"=== Macros ({len(rows)}) ===\n")
    cur_cat = None
    for r in rows:
        if r['category'] != cur_cat:
            cur_cat = r['category']
            print(f"\n  [{cur_cat}]:")
        val = f"= {r['value']}" if r['value'] else ''
        print(f"    {r['name']:40s} {val:20s} ({r['file_path']}:{r['line_no']})")
    conn.close()

def cmd_impact(path: str):
    """Show full impact analysis for a file: deps, rdeps, tests, ABI, security."""
    conn = get_conn()
    # Find the file
    r = conn.execute("SELECT * FROM source_files WHERE path LIKE ?", (f'%{path}%',)).fetchone()
    if not r:
        print(f"File not found: {path}")
        return
    fpath = r['path']
    print(f"=== IMPACT ANALYSIS: {fpath} ===")
    print(f"  Layer: {r['layer']}, Subsystem: {r['subsystem']}, Lines: {r['lines']}\n")

    # Direct includes
    deps = conn.execute("SELECT included_file FROM include_deps WHERE source_file=?", (fpath,)).fetchall()
    print(f"  DEPENDS ON ({len(deps)}):")
    for d in deps:
        print(f"    {d['included_file']}")

    # Reverse deps
    fname = Path(fpath).name
    rdeps = conn.execute("SELECT source_file FROM include_deps WHERE included_file LIKE ?",
                         (f'%{fname}%',)).fetchall()
    print(f"\n  DEPENDED ON BY ({len(rdeps)}):")
    for d in rdeps:
        print(f"    {d['source_file']}")

    # Tests
    tests = conn.execute("""SELECT src_id FROM edges
        WHERE dst_type='source_file' AND dst_id=? AND relation='covers'""", (fpath,)).fetchall()
    print(f"\n  TESTED BY ({len(tests)}):")
    for t in tests:
        print(f"    {t['src_id']}")

    # ABI functions
    funcs = conn.execute("""SELECT src_id FROM edges
        WHERE dst_type='source_file' AND dst_id=? AND relation='implements'""", (fpath,)).fetchall()
    print(f"\n  ABI FUNCTIONS ({len(funcs)}):")
    for f in funcs:
        print(f"    {f['src_id']}")

    # Security patterns
    secs = conn.execute("SELECT pattern, line_no FROM security_patterns WHERE source_file=? ORDER BY line_no",
                        (fpath,)).fetchall()
    if secs:
        print(f"\n  SECURITY PATTERNS ({len(secs)}):")
        for s in secs:
            print(f"    L{s['line_no']:4d} {s['pattern']}")

    # ABI routing through this file
    routings = conn.execute("""SELECT abi_function, layer FROM abi_routing
        WHERE internal_call LIKE ? OR abi_function LIKE ?""",
        (f'%{fname.replace(".cpp","").replace(".hpp","")}%',
         f'%{fname.replace(".cpp","").replace(".hpp","")}%')).fetchall()
    if routings:
        print(f"\n  ABI ROUTING ({len(routings)}):")
        for rt in routings:
            print(f"    [{rt['layer']:4s}] {rt['abi_function']}")

    conn.close()

def cmd_gaps():
    """Show test coverage gaps -- core files with no test coverage."""
    conn = get_conn()
    rows = conn.execute("SELECT * FROM v_coverage_gaps").fetchall()
    total_lines = sum(r['lines'] for r in rows)
    print(f"=== Test Coverage Gaps ({len(rows)} untested core files, {total_lines} total lines) ===\n")
    for r in rows:
        sec = f"  SEC:{r['security_patterns']}" if r['security_patterns'] else ''
        abi = f"  ABI:{r['abi_functions']}" if r['abi_functions'] else ''
        print(f"  [{r['layer']:4s}] {r['path']:50s} {r['lines']:5d} lines  ({r['subsystem'] or '-'}){sec}{abi}")
    conn.close()

def cmd_context(path: str):
    """One-shot context dump: summary + deps + rdeps + tests + security + routing + functions.
    Replaces 5-6 separate queries. Designed for maximum token efficiency."""
    conn = get_conn()
    # Find file
    r = conn.execute("SELECT * FROM source_files WHERE path LIKE ?", (f'%{path}%',)).fetchone()
    if not r:
        print(f"File not found: {path}")
        conn.close()
        return
    fpath = r['path']

    # Summary
    summary = conn.execute("SELECT summary FROM file_summaries WHERE path=?", (fpath,)).fetchone()
    desc = summary['summary'] if summary else '(no summary)'
    print(f"FILE: {fpath}  [{r['layer']}] {r['lines']} lines")
    print(f"  {desc}")
    print(f"  category={r['category']}  subsystem={r['subsystem'] or '-'}")

    # Dependencies (compact)
    deps = conn.execute("SELECT included_file FROM include_deps WHERE source_file=?", (fpath,)).fetchall()
    if deps:
        print(f"\nINCLUDES ({len(deps)}): {', '.join(d['included_file'] for d in deps)}")

    # Reverse deps (compact)
    fname = Path(fpath).name
    rdeps = conn.execute("SELECT source_file FROM include_deps WHERE included_file LIKE ?",
                         (f'%{fname}%',)).fetchall()
    if rdeps:
        print(f"\nINCLUDED BY ({len(rdeps)}): {', '.join(d['source_file'] for d in rdeps)}")

    # Tests
    tests = conn.execute("""SELECT src_id FROM edges
        WHERE dst_type='source_file' AND dst_id=? AND relation='covers'""", (fpath,)).fetchall()
    if tests:
        print(f"\nTESTS ({len(tests)}): {', '.join(t['src_id'] for t in tests)}")
    else:
        print(f"\nTESTS: NONE (coverage gap!)")

    # ABI functions
    funcs = conn.execute("""SELECT src_id FROM edges
        WHERE dst_type='source_file' AND dst_id=? AND relation='implements'""", (fpath,)).fetchall()
    if funcs:
        print(f"\nABI ({len(funcs)}): {', '.join(f['src_id'] for f in funcs)}")

    # Security patterns (compact counts)
    secs = conn.execute("""SELECT pattern, COUNT(*) as cnt FROM security_patterns
        WHERE source_file=? GROUP BY pattern""", (fpath,)).fetchall()
    if secs:
        sec_str = ', '.join(f"{s['pattern']}:{s['cnt']}" for s in secs)
        print(f"\nSECURITY: {sec_str}")

    # ABI routing
    base = fname.replace('.cpp', '').replace('.hpp', '')
    routings = conn.execute("""SELECT abi_function, internal_call, layer FROM abi_routing
        WHERE internal_call LIKE ? OR abi_function LIKE ?""",
        (f'%{base}%', f'%{base}%')).fetchall()
    if routings:
        print(f"\nROUTING ({len(routings)}):")
        for rt in routings:
            print(f"  [{rt['layer']:4s}] {rt['abi_function']} -> {rt['internal_call']}")

    # Function index (key section for token savings)
    fidx = conn.execute("""SELECT name, start_line, end_line, kind, class_name
        FROM function_index WHERE file_path=? ORDER BY start_line""", (fpath,)).fetchall()
    if fidx:
        print(f"\nFUNCTIONS ({len(fidx)}):")
        for f in fidx:
            cls = f"{f['class_name']}::" if f['class_name'] else ''
            span = f['end_line'] - f['start_line'] + 1
            print(f"  L{f['start_line']:4d}-{f['end_line']:4d} ({span:3d}) {cls}{f['name']}")

    conn.close()

def cmd_preflight(mode: str = None):
    """Run preflight quality checks (delegates to scripts/preflight.py)."""
    import subprocess
    script = Path(__file__).resolve().parent / 'preflight.py'
    args = ['python3', str(script)]
    if mode:
        args.append(mode)
    subprocess.run(args)


# ---------------------------------------------------------------------------
# PHASE 4: new query commands
# ---------------------------------------------------------------------------

def cmd_callgraph(func_name: str):
    """Show call graph for a function: who calls it (callers) and who it calls (callees)."""
    conn = get_conn()
    print(f"=== Call Graph: {func_name} ===\n")

    # Callers
    callers = conn.execute("""SELECT DISTINCT caller_func, caller_file, call_line
        FROM call_edges WHERE callee_func LIKE ?
        ORDER BY caller_file, call_line""", (f'%{func_name}%',)).fetchall()
    if callers:
        print(f"CALLERS ({len(callers)}):")
        for r in callers:
            print(f"  {r['caller_func']:40s}  ({r['caller_file']}:L{r['call_line']})")
    else:
        print("CALLERS: none found in call graph")

    # Callees
    callees = conn.execute("""SELECT DISTINCT callee_func, callee_file, call_line
        FROM call_edges WHERE caller_func LIKE ?
        ORDER BY call_line""", (f'%{func_name}%',)).fetchall()
    if callees:
        print(f"\nCALLEES ({len(callees)}):")
        for r in callees:
            print(f"  L{r['call_line'] or '?':4}  {r['callee_func']:40s}  {r['callee_file'] or '(unknown)'}")
    else:
        print("\nCALLEES: none found in call graph")

    conn.close()


def cmd_hotspots(top_n: str = '15'):
    """Show top N hotspot files ranked by composite risk score."""
    try:
        n = int(top_n)
    except (TypeError, ValueError):
        n = 15
    conn = get_conn()
    rows = conn.execute("""SELECT file_path, hotspot_score, coupling_score,
                                  security_density, test_coverage_gap,
                                  null_risk_score, reasons
                           FROM hotspot_scores
                           ORDER BY hotspot_score DESC LIMIT ?""", (n,)).fetchall()
    if not rows:
        print("No hotspot data. Rebuild graph with: python3 scripts/build_project_graph.py --rebuild")
        conn.close()
        return
    print(f"=== Top {n} Hotspot Files ===\n")
    print(f"  {'SCORE':>5}  {'COUP':>5}  {'SEC':>5}  {'GAP':>4}  FILE")
    print(f"  {'-'*5}  {'-'*5}  {'-'*5}  {'-'*4}  {'-'*50}")
    for r in rows:
        reasons = r['reasons'] or '[]'
        try:
            rl = json.loads(reasons)
        except Exception:
            rl = []
        tag = ','.join(rl[:2])
        print(f"  {r['hotspot_score']:>5.2f}  {r['coupling_score']:>5.2f}  "
              f"{r['security_density']:>5.2f}  {r['test_coverage_gap']:>4.0f}  "
              f"{r['file_path']}  [{tag}]")
    conn.close()


def cmd_dead(filter_str: str = None):
    """Show potentially dead/unreachable code from reachability analysis."""
    conn = get_conn()
    if filter_str:
        rows = conn.execute("""SELECT symbol, file_path, dead_reason, reach_via
            FROM reachability WHERE is_reachable=0 AND (symbol LIKE ? OR file_path LIKE ?)
            ORDER BY file_path, symbol""",
            (f'%{filter_str}%', f'%{filter_str}%')).fetchall()
    else:
        rows = conn.execute("""SELECT symbol, file_path, dead_reason, reach_via
            FROM reachability WHERE is_reachable=0 ORDER BY file_path, symbol""").fetchall()
    total = conn.execute("SELECT COUNT(*) AS cnt FROM reachability WHERE is_reachable=0").fetchone()['cnt']
    reachable = conn.execute("SELECT COUNT(*) AS cnt FROM reachability WHERE is_reachable=1").fetchone()['cnt']
    print(f"=== Dead Code Analysis ({total} unreachable / {reachable + total} total) ===\n")
    if not rows:
        print("  No unreachable functions found (or graph not built with call edges).")
        conn.close()
        return
    cur_file = None
    for r in rows[:100]:
        if r['file_path'] != cur_file:
            cur_file = r['file_path']
            print(f"\n  {cur_file}:")
        print(f"    {r['symbol']:40s}  [{r['dead_reason'] or 'no_caller'}]")
    if len(rows) > 100:
        print(f"\n  ... and {len(rows) - 100} more (use filter to narrow down)")
    conn.close()


def cmd_aliases(symbol: str = None):
    """Show symbol aliases and similar names (variant/typo detection)."""
    conn = get_conn()
    if symbol:
        rows = conn.execute("""SELECT canonical, alias, similarity, kind
            FROM symbol_aliases
            WHERE canonical LIKE ? OR alias LIKE ?
            ORDER BY similarity DESC""",
            (f'%{symbol}%', f'%{symbol}%')).fetchall()
    else:
        rows = conn.execute("""SELECT canonical, alias, similarity, kind
            FROM symbol_aliases ORDER BY similarity DESC LIMIT 50""").fetchall()
    total = conn.execute("SELECT COUNT(*) AS cnt FROM symbol_aliases").fetchone()['cnt']
    print(f"=== Symbol Aliases ({total} total, showing {len(rows)}) ===\n")
    if not rows:
        print("  No aliases found. (Rebuild graph to generate.)")
        conn.close()
        return
    for r in rows:
        print(f"  [{r['kind']:12s}] {r['similarity']:.3f}  {r['canonical']:40s}  ~=  {r['alias']}")
    conn.close()


def cmd_coverage(func_name: str = None):
    """Show which test targets cover a function (function-level coverage map)."""
    conn = get_conn()
    if func_name:
        rows = conn.execute("""SELECT ftm.function_name, ftm.function_file, ftm.test_target,
                                      ftm.coverage_type, fi.start_line, fi.end_line
                               FROM function_test_map ftm
                               LEFT JOIN function_index fi
                                   ON fi.file_path = ftm.function_file
                                   AND fi.name = ftm.function_name
                               WHERE ftm.function_name LIKE ?
                               ORDER BY ftm.function_file""",
                            (f'%{func_name}%',)).fetchall()
        print(f"=== Test Coverage: *{func_name}* ({len(rows)} mappings) ===\n")
        for r in rows:
            span = f"L{r['start_line']}-{r['end_line']}" if r['start_line'] else '?'
            print(f"  {r['function_name']:40s} {span:12s}  <- {r['test_target']}  [{r['coverage_type']}]")
    else:
        # Summary: files covered vs uncovered
        covered = conn.execute("SELECT COUNT(DISTINCT function_file) AS cnt FROM function_test_map").fetchone()['cnt']
        total_files = conn.execute("SELECT COUNT(DISTINCT file_path) AS cnt FROM function_index").fetchone()['cnt']
        total_funcs = conn.execute("SELECT COUNT(*) AS cnt FROM function_test_map").fetchone()['cnt']
        print(f"=== Function Coverage Summary ===\n")
        print(f"  Files with coverage: {covered}/{total_files}")
        print(f"  Total (function, test) mappings: {total_funcs}")
        print(f"\nTop covered files:")
        for r in conn.execute("""SELECT function_file, COUNT(DISTINCT test_target) AS tests,
                                         COUNT(DISTINCT function_name) AS funcs
                                  FROM function_test_map
                                  GROUP BY function_file ORDER BY tests DESC LIMIT 15""").fetchall():
            print(f"  {r['function_file']:55s} {r['tests']:3d} tests  {r['funcs']:4d} functions")
    conn.close()


def cmd_config(filter_type: str = None):
    """Show config/CMake option -> code symbol bindings."""
    conn = get_conn()
    if filter_type:
        rows = conn.execute("""SELECT config_file, config_key, code_symbol, code_file,
                                      binding_type, description
                               FROM config_bindings WHERE binding_type LIKE ? OR config_file LIKE ?
                               ORDER BY binding_type, config_key""",
                            (f'%{filter_type}%', f'%{filter_type}%')).fetchall()
    else:
        rows = conn.execute("""SELECT config_file, config_key, code_symbol, code_file,
                                      binding_type, description
                               FROM config_bindings ORDER BY binding_type, config_key""").fetchall()
    print(f"=== Config Bindings ({len(rows)}) ===\n")
    cur_type = None
    for r in rows:
        if r['binding_type'] != cur_type:
            cur_type = r['binding_type']
            print(f"\n  [{cur_type}]:")
        file_str = f"  ({r['code_file']})" if r['code_file'] else ''
        print(f"    {r['config_key']:40s}  ->  {r['code_symbol']}{file_str}")
    conn.close()


def cmd_tags(filter_str: str = None):
    """List semantic tags and their coverage across entities."""
    conn = get_conn()
    if filter_str:
        rows = conn.execute("""
            SELECT st.tag, st.domain, st.description, COUNT(et.id) AS tagged_entities
            FROM semantic_tags st
            LEFT JOIN entity_tags et ON et.tag = st.tag
            WHERE st.tag LIKE ? OR st.domain LIKE ? OR st.description LIKE ?
            GROUP BY st.tag, st.domain, st.description
            ORDER BY tagged_entities DESC, st.tag
        """, (f'%{filter_str}%', f'%{filter_str}%', f'%{filter_str}%')).fetchall()
    else:
        rows = conn.execute("""
            SELECT st.tag, st.domain, st.description, COUNT(et.id) AS tagged_entities
            FROM semantic_tags st
            LEFT JOIN entity_tags et ON et.tag = st.tag
            GROUP BY st.tag, st.domain, st.description
            ORDER BY tagged_entities DESC, st.tag
        """).fetchall()
    print(f"=== Semantic Tags ({len(rows)}) ===\n")
    for r in rows:
        print(f"  {r['tag']:24s} [{r['domain']}]  entities={r['tagged_entities']}")
        print(f"    {r['description']}")
    conn.close()


def cmd_tag(tag: str):
    """Show entities carrying a specific semantic tag."""
    conn = get_conn()
    rows = conn.execute("""
        SELECT entity_type, entity_id, confidence, origin
        FROM entity_tags
        WHERE tag LIKE ?
        ORDER BY entity_type, confidence DESC, entity_id
    """, (f'%{tag}%',)).fetchall()
    print(f"=== Semantic Tag: {tag} ({len(rows)} entities) ===\n")
    if not rows:
        print("  No entities found.")
        conn.close()
        return
    current_type = None
    for r in rows:
        if r['entity_type'] != current_type:
            current_type = r['entity_type']
            print(f"\n  [{current_type}]")
        print(f"    {r['entity_id']}  (confidence={r['confidence']:.2f}, {r['origin']})")
    conn.close()


def cmd_symbol(name: str):
    """Show the full reasoning profile for a function/symbol."""
    conn = get_conn()
    rows = conn.execute("""
        SELECT *
        FROM v_symbol_reasoning
        WHERE symbol_name LIKE ?
        ORDER BY optimization_priority DESC, risk_score DESC, file_path
    """, (f'%{name}%',)).fetchall()
    print(f"=== Symbol Reasoning: {name} ({len(rows)}) ===\n")
    if not rows:
        print("  No symbol found.")
        conn.close()
        return
    for r in rows[:20]:
        print(f"{r['symbol_name']}  [{r['file_path']}]")
        print(f"  semantic: category={r['category']} math_core={r['math_core']} backend={r['backend']} coord={r['coordinate_model']}")
        print(f"  security: secret_class={r['secret_class']} secret={r['uses_secret_input']} ct={r['must_be_constant_time']} public_only={r['public_data_only']}")
        print(f"  perf: hotness={r['hotness_score']:.1f} gpu_candidate={r['gpu_candidate']} batchable={r['batchable']}")
        print(f"  audit: unit={r['covered_by_unit_test']} fuzz={r['covered_by_fuzz']} ct={r['covered_by_ct_test']}")
        print(f"  history: modified={r['times_modified']} recent={r['recently_modified']}")
        print(f"  scores: risk={r['risk_score']:.1f} gain={r['gain_score']:.1f} priority={r['optimization_priority']:.1f}")
        print()
    conn.close()


def cmd_optimize(top_n: str = '15'):
    """Show high-gain / lower-risk optimization candidates."""
    try:
        n = int(top_n)
    except (TypeError, ValueError):
        n = 15
    conn = get_conn()
    rows = conn.execute("""
        SELECT symbol_name, file_path, category, backend, hotness_score, gpu_candidate,
               batchable, risk_score, gain_score, optimization_priority
        FROM v_symbol_reasoning
        WHERE category NOT IN ('test', 'audit', 'fuzz')
        ORDER BY optimization_priority DESC, gain_score DESC
        LIMIT ?
    """, (n,)).fetchall()
    print(f"=== Optimization Candidates ({len(rows)}) ===\n")
    for r in rows:
        print(f"  {r['optimization_priority']:>5.1f}  gain={r['gain_score']:>5.1f}  risk={r['risk_score']:>5.1f}  "
              f"{r['symbol_name']}  [{r['category']}, {r['backend']}]")
        print(f"         {r['file_path']}  hotness={r['hotness_score']:.1f} batchable={r['batchable']} gpu_candidate={r['gpu_candidate']}")
    conn.close()


def cmd_risk(top_n: str = '15'):
    """Show high-risk / high-impact symbols that deserve manual review."""
    try:
        n = int(top_n)
    except (TypeError, ValueError):
        n = 15
    conn = get_conn()
    rows = conn.execute("""
        SELECT symbol_name, file_path, category, secret_class, risk_score, gain_score,
               covered_by_unit_test, covered_by_fuzz, covered_by_ct_test, recently_modified
        FROM v_symbol_reasoning
        ORDER BY risk_score DESC, gain_score DESC
        LIMIT ?
    """, (n,)).fetchall()
    print(f"=== Risk Hotspots ({len(rows)}) ===\n")
    for r in rows:
        print(f"  risk={r['risk_score']:>5.1f}  gain={r['gain_score']:>5.1f}  {r['symbol_name']}  [{r['category']}, {r['secret_class']}]")
        print(f"       {r['file_path']}  unit={r['covered_by_unit_test']} fuzz={r['covered_by_fuzz']} ct={r['covered_by_ct_test']} recent={r['recently_modified']}")
    conn.close()


def cmd_gpuwork(top_n: str = '15'):
    """Show top CPU symbols that look like GPU/offload candidates."""
    try:
        n = int(top_n)
    except (TypeError, ValueError):
        n = 15
    conn = get_conn()
    rows = conn.execute("""
        SELECT symbol_name, file_path, category, hotness_score, batchable,
               compute_bound, risk_score, gain_score, optimization_priority
        FROM v_symbol_reasoning
        WHERE backend='cpu' AND gpu_candidate=1
        ORDER BY gain_score DESC, optimization_priority DESC
        LIMIT ?
    """, (n,)).fetchall()
    print(f"=== GPU Candidate Symbols ({len(rows)}) ===\n")
    for r in rows:
        print(f"  gain={r['gain_score']:>5.1f}  risk={r['risk_score']:>5.1f}  {r['symbol_name']}  [{r['category']}]")
        print(f"       {r['file_path']}  hotness={r['hotness_score']:.1f} batchable={r['batchable']} compute_bound={r['compute_bound']} priority={r['optimization_priority']:.1f}")
    conn.close()


def cmd_fragile(top_n: str = '15'):
    """Show ct-sensitive or invalid-input-sensitive symbols with weak coverage and recent churn."""
    try:
        n = int(top_n)
    except (TypeError, ValueError):
        n = 15
    conn = get_conn()
    rows = conn.execute("""
        SELECT ss.symbol_name, ss.file_path, ss.secret_class,
               sec.invalid_input_sensitive, cov.covered_by_unit_test,
               cov.covered_by_fuzz, cov.covered_by_ct_test,
               cov.known_fragile, hist.recently_modified, score.risk_score
        FROM symbol_semantics ss
        JOIN symbol_security sec
          ON sec.symbol_name = ss.symbol_name AND sec.file_path = ss.file_path
        JOIN symbol_audit_coverage cov
          ON cov.symbol_name = ss.symbol_name AND cov.file_path = ss.file_path
        JOIN symbol_history hist
          ON hist.symbol_name = ss.symbol_name AND hist.file_path = ss.file_path
        JOIN symbol_scores score
          ON score.symbol_name = ss.symbol_name AND score.file_path = ss.file_path
        WHERE (sec.must_be_constant_time=1 OR sec.invalid_input_sensitive=1)
          AND (cov.covered_by_fuzz=0 OR cov.covered_by_ct_test=0)
        ORDER BY score.risk_score DESC, hist.recently_modified DESC, cov.known_fragile DESC
        LIMIT ?
    """, (n,)).fetchall()
    print(f"=== Fragile Symbols ({len(rows)}) ===\n")
    for r in rows:
        print(f"  risk={r['risk_score']:>5.1f}  {r['symbol_name']}  [{r['secret_class']}]")
        print(f"       {r['file_path']}  invalid_input={r['invalid_input_sensitive']} unit={r['covered_by_unit_test']} fuzz={r['covered_by_fuzz']} ct={r['covered_by_ct_test']} recent={r['recently_modified']} fragile={r['known_fragile']}")
    conn.close()


COMMANDS = {
    'search': ('search <query>', cmd_search),
    'file': ('file <path>', cmd_file),
    'subsystem': ('subsystem <name>', cmd_subsystem),
    'deps': ('deps <source_file>', cmd_deps),
    'rdeps': ('rdeps <header>', cmd_rdeps),
    'abi': ('abi [category]', cmd_abi),
    'test': ('test [filter]', cmd_test),
    'layer': ('layer <name>', cmd_layer),
    'function': ('function <name>', cmd_function),
    'audit': ('audit [section]', cmd_audit),
    'platform': ('platform <name>', cmd_platform),
    'summary': ('summary', cmd_summary),
    'sql': ('sql "<query>"', cmd_sql),
    'methods': ('methods [class]', cmd_methods),
    'security': ('security [file]', cmd_security),
    'routing': ('routing [function]', cmd_routing),
    'bindings': ('bindings [language]', cmd_bindings),
    'macros': ('macros [category]', cmd_macros),
    'impact': ('impact <file>', cmd_impact),
    'gaps': ('gaps', cmd_gaps),
    'context': ('context <file>', cmd_context),
    'preflight': ('preflight [--security|--coverage|--abi]', cmd_preflight),
    # Phase 4: new commands
    'callgraph': ('callgraph <function>', cmd_callgraph),
    'hotspots': ('hotspots [N]', cmd_hotspots),
    'dead': ('dead [filter]', cmd_dead),
    'aliases': ('aliases [symbol]', cmd_aliases),
    'coverage': ('coverage [function]', cmd_coverage),
    'config': ('config [type]', cmd_config),
    'tags': ('tags [filter]', cmd_tags),
    'tag': ('tag <name>', cmd_tag),
    'symbol': ('symbol <name>', cmd_symbol),
    'optimize': ('optimize [N]', cmd_optimize),
    'risk': ('risk [N]', cmd_risk),
    'gpuwork': ('gpuwork [N]', cmd_gpuwork),
    'fragile': ('fragile [N]', cmd_fragile),
}

if __name__ == '__main__':
    if len(sys.argv) < 2 or sys.argv[1] not in COMMANDS:
        print("Usage: query_graph.py <command> [args]\n")
        print("Commands:")
        for name, (usage, _) in sorted(COMMANDS.items()):
            print(f"  {usage}")
        sys.exit(1)

    cmd_name = sys.argv[1]
    args = ' '.join(sys.argv[2:]) if len(sys.argv) > 2 else None
    handler = COMMANDS[cmd_name][1]

    if args:
        handler(args)
    else:
        handler()