trustgraph/tests/unit/test_agent/test_completion_dispatch.py

"""
Unit tests for completion dispatch — verifies that agent_request() in the
orchestrator service correctly intercepts subagent completion messages and
routes them to _handle_subagent_completion.
"""

import pytest
from unittest.mock import MagicMock, AsyncMock, patch

from trustgraph.schema import AgentRequest, AgentStep

from trustgraph.agent.orchestrator.aggregator import Aggregator


def _make_request(**kwargs):
    defaults = dict(
        question="Test question",
        collection="default",
    )
    defaults.update(kwargs)
    return AgentRequest(**defaults)


def _make_completion_request(correlation_id, goal, answer):
    """Build a completion request as emit_subagent_completion would."""
    step = AgentStep(
        thought="Subagent completed",
        action="complete",
        arguments={},
        observation=answer,
        step_type="subagent-completion",
    )
    return _make_request(
        correlation_id=correlation_id,
        parent_session_id="parent-sess",
        subagent_goal=goal,
        expected_siblings=2,
        history=[step],
    )


class TestCompletionDetection:
    """Test that completion messages are correctly identified."""

    def test_is_completion_when_correlation_id_and_step_type(self):
        req = _make_completion_request("corr-1", "goal-a", "answer-a")

        has_correlation = bool(getattr(req, 'correlation_id', ''))
        is_completion = any(
            getattr(h, 'step_type', '') == 'subagent-completion'
            for h in req.history
        )

        assert has_correlation
        assert is_completion

    def test_not_completion_without_correlation_id(self):
        step = AgentStep(
            step_type="subagent-completion",
            observation="answer",
        )
        req = _make_request(
            correlation_id="",
            history=[step],
        )

        has_correlation = bool(getattr(req, 'correlation_id', ''))
        assert not has_correlation

    def test_not_completion_without_step_type(self):
        step = AgentStep(
            step_type="react",
            observation="answer",
        )
        req = _make_request(
            correlation_id="corr-1",
            history=[step],
        )

        is_completion = any(
            getattr(h, 'step_type', '') == 'subagent-completion'
            for h in req.history
        )
        assert not is_completion

    def test_not_completion_with_empty_history(self):
        req = _make_request(
            correlation_id="corr-1",
            history=[],
        )
        assert not req.history


class TestAggregatorIntegration:
    """Test the aggregator flow as used by _handle_subagent_completion."""

    def test_full_completion_flow(self):
        """Simulates the flow: register, record completions, build synthesis."""
        agg = Aggregator()
        template = _make_request(
            question="Original question",
            streaming=True,
            task_type="risk-assessment",
            framing="Assess risks",
            session_id="parent-sess",
        )

        # Register fan-out
        agg.register_fanout("corr-1", "parent-sess", 2,
                            request_template=template)

        # First completion — not all done
        all_done = agg.record_completion(
            "corr-1", "goal-a", "answer-a",
        )
        assert all_done is False

        # Second completion — all done
        all_done = agg.record_completion(
            "corr-1", "goal-b", "answer-b",
        )
        assert all_done is True

        # Peek at template
        peeked = agg.get_original_request("corr-1")
        assert peeked.question == "Original question"

        # Build synthesis request
        synth = agg.build_synthesis_request(
            "corr-1",
            original_question="Original question",
            collection="default",
        )

        # Verify synthesis request
        assert synth.pattern == "supervisor"
        assert synth.correlation_id == ""
        assert synth.session_id == "parent-sess"
        assert synth.streaming is True

        # Verify synthesis history has results
        synth_steps = [
            s for s in synth.history
            if getattr(s, 'step_type', '') == 'synthesise'
        ]
        assert len(synth_steps) == 1
        assert synth_steps[0].subagent_results == {
            "goal-a": "answer-a",
            "goal-b": "answer-b",
        }

    def test_synthesis_request_not_detected_as_completion(self):
        """The synthesis request must not be intercepted as a completion."""
        agg = Aggregator()
        template = _make_request(session_id="parent-sess")
        agg.register_fanout("corr-1", "parent-sess", 1,
                            request_template=template)
        agg.record_completion("corr-1", "goal", "answer")

        synth = agg.build_synthesis_request(
            "corr-1", "question", "default",
        )

        # correlation_id must be empty so it's not intercepted
        assert synth.correlation_id == ""

        # Even if we check for completion step, shouldn't match
        is_completion = any(
            getattr(h, 'step_type', '') == 'subagent-completion'
            for h in synth.history
        )
        assert not is_completion
Update tests for agent-orchestrator (#745) Add 96 tests covering the orchestrator's aggregation, provenance, routing, and explainability parsing. These verify the supervisor fan-out/fan-in lifecycle, the new RDF provenance types (Decomposition, Finding, Plan, StepResult, Synthesis), and their round-trip through the wire format. Unit tests (84): - Aggregator: register, record completion, peek, build synthesis, cleanup - Provenance triple builders: types, provenance links, goals/steps, labels - Explainability parsing: from_triples dispatch, field extraction for all new entity types, precedence over existing types - PatternBase: is_subagent detection, emit_subagent_completion message shape - Completion dispatch: detection logic, full aggregator integration flow, synthesis request not re-intercepted as completion - MetaRouter: task type identification, pattern selection, valid_patterns constraints, fallback on LLM error or unknown response Contract tests (12): - Orchestration fields on AgentRequest round-trip correctly - subagent-completion and synthesise step types in request history - Plan steps with status and dependencies - Provenance triple builder → wire format → from_triples round-trip for all five new entity types 2026-03-31 13:12:26 +01:00			`"""`
			`Unit tests for completion dispatch — verifies that agent_request() in the`
			`orchestrator service correctly intercepts subagent completion messages and`
			`routes them to _handle_subagent_completion.`
			`"""`

			`import pytest`
			`from unittest.mock import MagicMock, AsyncMock, patch`

			`from trustgraph.schema import AgentRequest, AgentStep`

			`from trustgraph.agent.orchestrator.aggregator import Aggregator`


			`def _make_request(**kwargs):`
			`defaults = dict(`
			`question="Test question",`
			`collection="default",`
			`)`
			`defaults.update(kwargs)`
			`return AgentRequest(**defaults)`


			`def _make_completion_request(correlation_id, goal, answer):`
			`"""Build a completion request as emit_subagent_completion would."""`
			`step = AgentStep(`
			`thought="Subagent completed",`
			`action="complete",`
			`arguments={},`
			`observation=answer,`
			`step_type="subagent-completion",`
			`)`
			`return _make_request(`
			`correlation_id=correlation_id,`
			`parent_session_id="parent-sess",`
			`subagent_goal=goal,`
			`expected_siblings=2,`
			`history=[step],`
			`)`


			`class TestCompletionDetection:`
			`"""Test that completion messages are correctly identified."""`

			`def test_is_completion_when_correlation_id_and_step_type(self):`
			`req = _make_completion_request("corr-1", "goal-a", "answer-a")`

			`has_correlation = bool(getattr(req, 'correlation_id', ''))`
			`is_completion = any(`
			`getattr(h, 'step_type', '') == 'subagent-completion'`
			`for h in req.history`
			`)`

			`assert has_correlation`
			`assert is_completion`

			`def test_not_completion_without_correlation_id(self):`
			`step = AgentStep(`
			`step_type="subagent-completion",`
			`observation="answer",`
			`)`
			`req = _make_request(`
			`correlation_id="",`
			`history=[step],`
			`)`

			`has_correlation = bool(getattr(req, 'correlation_id', ''))`
			`assert not has_correlation`

			`def test_not_completion_without_step_type(self):`
			`step = AgentStep(`
			`step_type="react",`
			`observation="answer",`
			`)`
			`req = _make_request(`
			`correlation_id="corr-1",`
			`history=[step],`
			`)`

			`is_completion = any(`
			`getattr(h, 'step_type', '') == 'subagent-completion'`
			`for h in req.history`
			`)`
			`assert not is_completion`

			`def test_not_completion_with_empty_history(self):`
			`req = _make_request(`
			`correlation_id="corr-1",`
			`history=[],`
			`)`
			`assert not req.history`


			`class TestAggregatorIntegration:`
			`"""Test the aggregator flow as used by _handle_subagent_completion."""`

			`def test_full_completion_flow(self):`
			`"""Simulates the flow: register, record completions, build synthesis."""`
			`agg = Aggregator()`
			`template = _make_request(`
			`question="Original question",`
			`streaming=True,`
			`task_type="risk-assessment",`
			`framing="Assess risks",`
			`session_id="parent-sess",`
			`)`

			`# Register fan-out`
			`agg.register_fanout("corr-1", "parent-sess", 2,`
			`request_template=template)`

			`# First completion — not all done`
			`all_done = agg.record_completion(`
			`"corr-1", "goal-a", "answer-a",`
			`)`
			`assert all_done is False`

			`# Second completion — all done`
			`all_done = agg.record_completion(`
			`"corr-1", "goal-b", "answer-b",`
			`)`
			`assert all_done is True`

			`# Peek at template`
			`peeked = agg.get_original_request("corr-1")`
			`assert peeked.question == "Original question"`

			`# Build synthesis request`
			`synth = agg.build_synthesis_request(`
			`"corr-1",`
			`original_question="Original question",`
			`collection="default",`
			`)`

			`# Verify synthesis request`
			`assert synth.pattern == "supervisor"`
			`assert synth.correlation_id == ""`
			`assert synth.session_id == "parent-sess"`
			`assert synth.streaming is True`

			`# Verify synthesis history has results`
			`synth_steps = [`
			`s for s in synth.history`
			`if getattr(s, 'step_type', '') == 'synthesise'`
			`]`
			`assert len(synth_steps) == 1`
			`assert synth_steps[0].subagent_results == {`
			`"goal-a": "answer-a",`
			`"goal-b": "answer-b",`
			`}`

			`def test_synthesis_request_not_detected_as_completion(self):`
			`"""The synthesis request must not be intercepted as a completion."""`
			`agg = Aggregator()`
			`template = _make_request(session_id="parent-sess")`
			`agg.register_fanout("corr-1", "parent-sess", 1,`
			`request_template=template)`
			`agg.record_completion("corr-1", "goal", "answer")`

			`synth = agg.build_synthesis_request(`
feat: workspace-based multi-tenancy, replacing user as tenancy axis (#840) Introduces `workspace` as the isolation boundary for config, flows, library, and knowledge data. Removes `user` as a schema-level field throughout the code, API specs, and tests; workspace provides the same separation more cleanly at the trusted flow.workspace layer rather than through client-supplied message fields. Design ------ - IAM tech spec (docs/tech-specs/iam.md) documents current state, proposed auth/access model, and migration direction. - Data ownership model (docs/tech-specs/data-ownership-model.md) captures the workspace/collection/flow hierarchy. Schema + messaging ------------------ - Drop `user` field from AgentRequest/Step, GraphRagQuery, DocumentRagQuery, Triples/Graph/Document/Row EmbeddingsRequest, Sparql/Rows/Structured QueryRequest, ToolServiceRequest. - Keep collection/workspace routing via flow.workspace at the service layer. - Translators updated to not serialise/deserialise user. API specs --------- - OpenAPI schemas and path examples cleaned of user fields. - Websocket async-api messages updated. - Removed the unused parameters/User.yaml. Services + base --------------- - Librarian, collection manager, knowledge, config: all operations scoped by workspace. Config client API takes workspace as first positional arg. - `flow.workspace` set at flow start time by the infrastructure; no longer pass-through from clients. - Tool service drops user-personalisation passthrough. CLI + SDK --------- - tg-init-workspace and workspace-aware import/export. - All tg-* commands drop user args; accept --workspace. - Python API/SDK (flow, socket_client, async_, explainability, library) drop user kwargs from every method signature. MCP server ---------- - All tool endpoints drop user parameters; socket_manager no longer keyed per user. Flow service ------------ - Closure-based topic cleanup on flow stop: only delete topics whose blueprint template was parameterised AND no remaining live flow (across all workspaces) still resolves to that topic. Three scopes fall out naturally from template analysis: {id} -> per-flow, deleted on stop * {blueprint} -> per-blueprint, kept while any flow of the same blueprint exists * {workspace} -> per-workspace, kept while any flow in the workspace exists * literal -> global, never deleted (e.g. tg.request.librarian) Fixes a bug where stopping a flow silently destroyed the global librarian exchange, wedging all library operations until manual restart. RabbitMQ backend ---------------- - heartbeat=60, blocked_connection_timeout=300. Catches silently dead connections (broker restart, orphaned channels, network partitions) within ~2 heartbeat windows, so the consumer reconnects and re-binds its queue rather than sitting forever on a zombie connection. Tests ----- - Full test refresh: unit, integration, contract, provenance. - Dropped user-field assertions and constructor kwargs across ~100 test files. - Renamed user-collection isolation tests to workspace-collection. 2026-04-21 23:23:01 +01:00			`"corr-1", "question", "default",`
Update tests for agent-orchestrator (#745) Add 96 tests covering the orchestrator's aggregation, provenance, routing, and explainability parsing. These verify the supervisor fan-out/fan-in lifecycle, the new RDF provenance types (Decomposition, Finding, Plan, StepResult, Synthesis), and their round-trip through the wire format. Unit tests (84): - Aggregator: register, record completion, peek, build synthesis, cleanup - Provenance triple builders: types, provenance links, goals/steps, labels - Explainability parsing: from_triples dispatch, field extraction for all new entity types, precedence over existing types - PatternBase: is_subagent detection, emit_subagent_completion message shape - Completion dispatch: detection logic, full aggregator integration flow, synthesis request not re-intercepted as completion - MetaRouter: task type identification, pattern selection, valid_patterns constraints, fallback on LLM error or unknown response Contract tests (12): - Orchestration fields on AgentRequest round-trip correctly - subagent-completion and synthesise step types in request history - Plan steps with status and dependencies - Provenance triple builder → wire format → from_triples round-trip for all five new entity types 2026-03-31 13:12:26 +01:00			`)`

			`# correlation_id must be empty so it's not intercepted`
			`assert synth.correlation_id == ""`

			`# Even if we check for completion step, shouldn't match`
			`is_completion = any(`
			`getattr(h, 'step_type', '') == 'subagent-completion'`
			`for h in synth.history`
			`)`
			`assert not is_completion`