mirror of
https://github.com/trustgraph-ai/trustgraph.git
synced 2026-04-25 16:36:21 +02:00
Update tests for agent-orchestrator (#745)
Add 96 tests covering the orchestrator's aggregation, provenance, routing, and explainability parsing. These verify the supervisor fan-out/fan-in lifecycle, the new RDF provenance types (Decomposition, Finding, Plan, StepResult, Synthesis), and their round-trip through the wire format.

Unit tests (84):
- Aggregator: register, record completion, peek, build synthesis, cleanup
- Provenance triple builders: types, provenance links, goals/steps, labels
- Explainability parsing: from_triples dispatch, field extraction for all new entity types, precedence over existing types
- PatternBase: is_subagent detection, emit_subagent_completion message shape
- Completion dispatch: detection logic, full aggregator integration flow, synthesis request not re-intercepted as completion
- MetaRouter: task type identification, pattern selection, valid_patterns constraints, fallback on LLM error or unknown response

Contract tests (12):
- Orchestration fields on AgentRequest round-trip correctly
- subagent-completion and synthesise step types in request history
- Plan steps with status and dependencies
- Provenance triple builder → wire format → from_triples round-trip for all five new entity types
This commit is contained in:
parent
7b734148b3
commit
816a8cfcf6
8 changed files with 1517 additions and 0 deletions
174
tests/unit/test_agent/test_completion_dispatch.py
Normal file
174
tests/unit/test_agent/test_completion_dispatch.py
Normal file
|
|
@ -0,0 +1,174 @@
|
|||
"""
|
||||
Unit tests for completion dispatch — verifies that agent_request() in the
|
||||
orchestrator service correctly intercepts subagent completion messages and
|
||||
routes them to _handle_subagent_completion.
|
||||
"""
|
||||
|
||||
import pytest
|
||||
from unittest.mock import MagicMock, AsyncMock, patch
|
||||
|
||||
from trustgraph.schema import AgentRequest, AgentStep
|
||||
|
||||
from trustgraph.agent.orchestrator.aggregator import Aggregator
|
||||
|
||||
|
||||
def _make_request(**kwargs):
    """Return an AgentRequest built from baseline test fields.

    The baseline supplies ``question``, ``user`` and ``collection``; any
    keyword argument passed by the caller overrides the baseline value or
    adds a further field to the request.
    """
    # Later entries win, so caller-supplied kwargs take precedence.
    fields = {
        "question": "Test question",
        "user": "testuser",
        "collection": "default",
        **kwargs,
    }
    return AgentRequest(**fields)
|
||||
|
||||
|
||||
def _make_completion_request(correlation_id, goal, answer):
    """Build a completion request as emit_subagent_completion would.

    The request carries a single history step of type
    ``subagent-completion`` whose observation is ``answer``, together
    with the orchestration fields (correlation id, parent session id,
    subagent goal, expected sibling count) set on the request itself.
    """
    completion_step = AgentStep(
        thought="Subagent completed",
        action="complete",
        arguments={},
        observation=answer,
        step_type="subagent-completion",
    )

    orchestration_fields = {
        "correlation_id": correlation_id,
        "parent_session_id": "parent-sess",
        "subagent_goal": goal,
        "expected_siblings": 2,
        "history": [completion_step],
    }
    return _make_request(**orchestration_fields)
|
||||
|
||||
|
||||
class TestCompletionDetection:
    """Test that completion messages are correctly identified.

    The checks are evaluated locally against request objects: a request
    counts as a completion when it has a non-empty ``correlation_id`` and
    at least one history step whose ``step_type`` is
    ``subagent-completion``.
    """

    @staticmethod
    def _has_correlation_id(request):
        # A missing attribute and an empty string are both "no correlation".
        return bool(getattr(request, 'correlation_id', ''))

    @staticmethod
    def _has_completion_step(request):
        # True as soon as any history entry is tagged as a completion.
        return any(
            getattr(entry, 'step_type', '') == 'subagent-completion'
            for entry in request.history
        )

    def test_is_completion_when_correlation_id_and_step_type(self):
        request = _make_completion_request("corr-1", "goal-a", "answer-a")

        correlated = self._has_correlation_id(request)
        completed = self._has_completion_step(request)

        assert correlated
        assert completed

    def test_not_completion_without_correlation_id(self):
        # The step is a completion, but the request has no correlation id.
        completion_step = AgentStep(
            step_type="subagent-completion",
            observation="answer",
        )
        request = _make_request(
            correlation_id="",
            history=[completion_step],
        )

        assert not self._has_correlation_id(request)

    def test_not_completion_without_step_type(self):
        # The request is correlated, but its only step is a "react" step.
        react_step = AgentStep(
            step_type="react",
            observation="answer",
        )
        request = _make_request(
            correlation_id="corr-1",
            history=[react_step],
        )

        assert not self._has_completion_step(request)

    def test_not_completion_with_empty_history(self):
        request = _make_request(
            correlation_id="corr-1",
            history=[],
        )
        assert not request.history
|
||||
|
||||
|
||||
class TestAggregatorIntegration:
    """Test the aggregator flow as used by _handle_subagent_completion."""

    def test_full_completion_flow(self):
        """Simulates the flow: register, record completions, build synthesis."""
        aggregator = Aggregator()
        original_request = _make_request(
            question="Original question",
            streaming=True,
            task_type="risk-assessment",
            framing="Assess risks",
            session_id="parent-sess",
        )

        # Fan out to two subagents under one correlation id.
        aggregator.register_fanout(
            "corr-1", "parent-sess", 2,
            request_template=original_request,
        )

        # One of two results in: the fan-out is still incomplete.
        first_done = aggregator.record_completion(
            "corr-1", "goal-a", "answer-a",
        )
        assert first_done is False

        # Second result in: every sibling has now reported.
        second_done = aggregator.record_completion(
            "corr-1", "goal-b", "answer-b",
        )
        assert second_done is True

        # The stored template can be read back.
        stored_request = aggregator.get_original_request("corr-1")
        assert stored_request.question == "Original question"

        # Turn the collected results into a synthesis request.
        synthesis = aggregator.build_synthesis_request(
            "corr-1",
            original_question="Original question",
            user="testuser",
            collection="default",
        )

        # Request-level fields of the synthesis request.
        assert synthesis.pattern == "supervisor"
        assert synthesis.correlation_id == ""
        assert synthesis.session_id == "parent-sess"
        assert synthesis.streaming is True

        # Exactly one synthesise step, carrying both subagent answers.
        synthesise_steps = []
        for step in synthesis.history:
            if getattr(step, 'step_type', '') == 'synthesise':
                synthesise_steps.append(step)

        assert len(synthesise_steps) == 1
        expected_results = {
            "goal-a": "answer-a",
            "goal-b": "answer-b",
        }
        assert synthesise_steps[0].subagent_results == expected_results

    def test_synthesis_request_not_detected_as_completion(self):
        """The synthesis request must not be intercepted as a completion."""
        aggregator = Aggregator()
        original_request = _make_request(session_id="parent-sess")
        aggregator.register_fanout(
            "corr-1", "parent-sess", 1,
            request_template=original_request,
        )
        aggregator.record_completion("corr-1", "goal", "answer")

        synthesis = aggregator.build_synthesis_request(
            "corr-1", "question", "user", "default",
        )

        # An empty correlation_id keeps the request from being intercepted.
        assert synthesis.correlation_id == ""

        # Its history must not contain a completion step either.
        has_completion_step = any(
            getattr(step, 'step_type', '') == 'subagent-completion'
            for step in synthesis.history
        )
        assert not has_completion_step
|
||||
Loading…
Add table
Add a link
Reference in a new issue