mirror of
https://github.com/Kaelio/ktx.git
synced 2026-06-07 07:55:13 +02:00
* docs(specs): design research-agent MCP tools and ktx mcp daemon Adds the 2026-05-14 design spec for exposing four new MCP tools (discover_data, entity_details, dictionary_search, sql_execution), shipping a ktx-research skill, and introducing an HTTP-only ktx mcp daemon so external agents can use KTX as a research-capable context layer. * Refine research-agent MCP tools spec after adversarial review iteration 1 * Refine research-agent MCP tools spec after adversarial review iteration 2 * Refine research-agent MCP tools spec after adversarial review iteration 3 * Refine spec: drop connectionName compat carve-out and ground summary/snippet provenance per kind * feat(daemon): validate read-only SQL with sqlglot * feat(context): expose read-only SQL validation port * feat(context): register MCP sql execution tool * feat(context): execute MCP SQL through validated connector path * test(context): update SQL analysis port fixtures * docs: add research-agent MCP sql execution foundation plan * feat(context): add scan-backed entity details service * feat(context): register MCP entity details tool * feat(context): expose local MCP entity details * test(context): align entity details scan fixtures * docs: add research-agent MCP entity_details plan * feat(context): add dictionary search service * feat(context): register MCP dictionary search tool * feat(context): expose local MCP dictionary search * docs: add research-agent MCP dictionary_search plan * feat: add MCP discover data service * feat: expose discover data MCP tool * feat: wire local discover data MCP port * docs: add research-agent MCP discover_data plan * feat(cli): add mcp http security helpers * feat(cli): host mcp over streamable http * feat(cli): manage mcp daemon lifecycle * feat(cli): add ktx mcp commands * fix(cli): stabilize mcp daemon verification * docs: add research-agent MCP http daemon plan * feat(cli): install KTX research skill * feat(cli): configure MCP clients in setup agents * feat(cli): support 
Claude local MCP setup scope * docs: add research-agent MCP setup-agents plan * refactor(context): use connectionId in warehouse verification tools * docs(context): update ingest verification prompts for connectionId * docs: add research-agent MCP ingest contract convergence plan * chore: build runtime artifacts in conductor setup --------- Co-authored-by: Andrey Avtomonov <7889985+andreybavt@users.noreply.github.com>
131 lines
4.3 KiB
Python
131 lines
4.3 KiB
Python
from __future__ import annotations
|
|
|
|
from ktx_daemon.sql_analysis import (
|
|
AnalyzeSqlBatchItem,
|
|
AnalyzeSqlBatchRequest,
|
|
ValidateReadOnlySqlRequest,
|
|
_columns_from_nodes,
|
|
analyze_sql_batch_response,
|
|
validate_read_only_sql_response,
|
|
)
|
|
|
|
|
|
def test_analyze_sql_batch_extracts_tables_and_clause_columns() -> None:
    """Analyze one aggregate join query and check its tables and per-clause columns.

    A single-item batch is submitted with the postgres dialect and one worker;
    the result is looked up under the item's id.
    """
    query = (
        "select o.status, count(*) "
        "from public.orders o "
        "join public.customers c on o.customer_id = c.id "
        "where o.created_at >= current_date - interval '30 day' "
        "group by o.status"
    )
    item = AnalyzeSqlBatchItem(id="orders_by_customer", sql=query)
    request = AnalyzeSqlBatchRequest(
        dialect="postgres",
        items=[item],
        max_workers=1,
    )

    analysis = analyze_sql_batch_response(request).results["orders_by_customer"]

    expected_tables = ["public.orders", "public.customers"]
    expected_columns = {
        "select": ["status"],
        "where": ["created_at"],
        "join": ["customer_id", "id"],
        "groupBy": ["status"],
    }
    assert analysis.error is None
    assert analysis.tables_touched == expected_tables
    assert analysis.columns_by_clause == expected_columns
|
|
|
|
|
|
def test_analyze_sql_batch_returns_per_item_parse_errors() -> None:
    """An unparsable item yields an error on its own result with empty tables and columns."""
    broken_item = AnalyzeSqlBatchItem(id="broken", sql="select * from where")
    request = AnalyzeSqlBatchRequest(
        dialect="postgres",
        items=[broken_item],
        max_workers=1,
    )

    outcome = analyze_sql_batch_response(request).results["broken"]

    # The failure is reported on the item's result rather than raised.
    assert outcome.tables_touched == []
    assert outcome.columns_by_clause == {}
    assert outcome.error is not None
|
|
|
|
|
|
def test_columns_from_nodes_ignores_non_expression_clause_values() -> None:
    """Booleans and None passed to ``_columns_from_nodes`` produce an empty list."""
    non_expression_values = [True, False, None]
    extracted = _columns_from_nodes(non_expression_values)
    assert extracted == []
|
|
|
|
|
|
def test_validate_read_only_sql_accepts_select_and_with_queries() -> None:
    """A plain SELECT and a CTE that only reads both validate with ok=True and no error."""
    select_request = ValidateReadOnlySqlRequest(
        dialect="postgres",
        sql="select id, status from public.orders where status = 'paid'",
    )
    select_response = validate_read_only_sql_response(select_request)

    cte_sql = (
        "with paid as (select * from public.orders where status = 'paid') "
        "select count(*) from paid"
    )
    with_request = ValidateReadOnlySqlRequest(dialect="postgres", sql=cte_sql)
    with_response = validate_read_only_sql_response(with_request)

    assert select_response.ok is True
    assert select_response.error is None
    assert with_response.ok is True
    assert with_response.error is None
|
|
|
|
|
|
def test_validate_read_only_sql_rejects_cte_dml() -> None:
    """An INSERT inside a CTE is rejected even though the outer statement is a SELECT."""
    request = ValidateReadOnlySqlRequest(
        dialect="postgres",
        sql="with x as (insert into audit.events values (1) returning *) select * from x",
    )

    verdict = validate_read_only_sql_response(request)

    assert verdict.ok is False
    assert verdict.error == "SQL contains read/write operation: Insert"
|
|
|
|
|
|
def test_validate_read_only_sql_rejects_multi_statement_payloads() -> None:
    """Two semicolon-separated statements in one payload are rejected."""
    request = ValidateReadOnlySqlRequest(
        dialect="postgres",
        sql="select * from public.orders; delete from public.orders",
    )

    verdict = validate_read_only_sql_response(request)

    assert verdict.ok is False
    assert verdict.error == "Only one SQL statement can be executed."
|
|
|
|
|
|
def test_validate_read_only_sql_rejects_commands_and_pragmas() -> None:
    """A postgres CALL and a sqlite PRAGMA are rejected, each with its own operation name."""
    call_request = ValidateReadOnlySqlRequest(
        dialect="postgres",
        sql="call refresh_stats()",
    )
    command_response = validate_read_only_sql_response(call_request)

    pragma_request = ValidateReadOnlySqlRequest(
        dialect="sqlite",
        sql="pragma table_info(users)",
    )
    pragma_response = validate_read_only_sql_response(pragma_request)

    assert command_response.ok is False
    assert command_response.error == "SQL contains read/write operation: Command"
    assert pragma_response.ok is False
    assert pragma_response.error == "SQL contains read/write operation: Pragma"
|
|
|
|
|
|
def test_validate_read_only_sql_reports_parse_errors() -> None:
    """Unparsable SQL gives ok=False and an error containing "Invalid expression"."""
    request = ValidateReadOnlySqlRequest(dialect="postgres", sql="select * from where")

    verdict = validate_read_only_sql_response(request)

    assert verdict.ok is False
    # Check for None first so the substring test below runs against a string.
    assert verdict.error is not None
    assert "Invalid expression" in verdict.error
|