mirror of
https://github.com/trustgraph-ai/trustgraph.git
synced 2026-04-26 00:46:22 +02:00
Adds a RabbitMQ backend as an alternative to Pulsar, selectable via PUBSUB_BACKEND=rabbitmq. Both backends implement the same PubSubBackend protocol — no application code changes needed to switch. RabbitMQ topology: - Single topic exchange per topicspace (e.g. 'tg') - Routing key derived from queue class and topic name - Shared consumers: named queue bound to exchange (competing, round-robin) - Exclusive consumers: anonymous auto-delete queue (broadcast, each gets every message). Used by Subscriber and config push consumer. - Thread-local producer connections (pika is not thread-safe) - Push-based consumption via basic_consume with process_data_events for heartbeat processing Consumer model changes: - Consumer class creates one backend consumer per concurrent task (required for pika thread safety, harmless for Pulsar) - Consumer class accepts consumer_type parameter - Subscriber passes consumer_type='exclusive' for broadcast semantics - Config push consumer uses consumer_type='exclusive' so every processor instance receives config updates - handle_one_from_queue receives consumer as parameter for correct per-connection ack/nack LibrarianClient: - New shared client class replacing duplicated librarian request-response code across 6+ services (chunking, decoders, RAG, etc.) 
- Uses stream-document instead of get-document-content for fetching document content in 1MB chunks (avoids broker message size limits) - Standalone object (self.librarian = LibrarianClient(...)) not a mixin - get-document-content marked deprecated in schema and OpenAPI spec Serialisation: - Extracted dataclass_to_dict/dict_to_dataclass to shared serialization.py (used by both Pulsar and RabbitMQ backends) Librarian queues: - Changed from flow class (persistent) back to request/response class now that stream-document eliminates large single messages - API upload chunk size reduced from 5MB to 3MB to stay under broker limits after base64 encoding Factory and CLI: - get_pubsub() handles 'rabbitmq' backend with RabbitMQ connection params - add_pubsub_args() includes RabbitMQ options (host, port, credentials) - add_pubsub_args(standalone=True) defaults to localhost for CLI tools - init_trustgraph skips Pulsar admin setup for non-Pulsar backends - tg-dump-queues and tg-monitor-prompts use backend abstraction - BaseClient and ConfigClient accept generic pubsub config
164 lines
5.7 KiB
Python
164 lines
5.7 KiB
Python
"""
|
|
Tests for queue naming and topic mapping.
|
|
"""
|
|
|
|
import pytest
|
|
import argparse
|
|
|
|
from trustgraph.schema.core.topic import queue
|
|
from trustgraph.base.pubsub import get_pubsub, add_pubsub_args
|
|
from trustgraph.base.pulsar_backend import PulsarBackend
|
|
|
|
|
|
class TestQueueFunction:
    """Checks on the identifier strings returned by ``queue()``."""

    def test_flow_default(self):
        # Only a topic name is supplied; the result carries the
        # 'flow' class and the 'tg' topicspace.
        name = queue('text-completion-request')
        assert name == 'flow:tg:text-completion-request'

    def test_request_class(self):
        name = queue('config', cls='request')
        assert name == 'request:tg:config'

    def test_response_class(self):
        name = queue('config', cls='response')
        assert name == 'response:tg:config'

    def test_state_class(self):
        name = queue('config', cls='state')
        assert name == 'state:tg:config'

    def test_custom_topicspace(self):
        # An explicit topicspace replaces 'tg' in the middle segment.
        name = queue('config', cls='request', topicspace='prod')
        assert name == 'request:prod:config'

    def test_default_class_is_flow(self):
        # Only the class prefix is checked here, not the full name.
        assert queue('something').startswith('flow:')
|
|
|
|
|
|
class TestPulsarMapTopic:
    """Checks on ``PulsarBackend.map_topic`` for each queue class."""

    @pytest.fixture
    def backend(self):
        """Return a bare PulsarBackend allocated without running __init__."""
        return object.__new__(PulsarBackend)

    def test_flow_maps_to_persistent(self, backend):
        mapped = backend.map_topic('flow:tg:text-completion-request')
        assert mapped == 'persistent://tg/flow/text-completion-request'

    def test_state_maps_to_persistent(self, backend):
        mapped = backend.map_topic('state:tg:config')
        assert mapped == 'persistent://tg/state/config'

    def test_request_maps_to_non_persistent(self, backend):
        mapped = backend.map_topic('request:tg:config')
        assert mapped == 'non-persistent://tg/request/config'

    def test_response_maps_to_non_persistent(self, backend):
        mapped = backend.map_topic('response:tg:librarian')
        assert mapped == 'non-persistent://tg/response/librarian'

    def test_passthrough_pulsar_uri(self, backend):
        # A value that is already a Pulsar URI must come back unchanged.
        already_mapped = 'persistent://tg/flow/something'
        result = backend.map_topic(already_mapped)
        assert result == already_mapped

    def test_invalid_format_raises(self, backend):
        malformed = 'bad-format'
        with pytest.raises(ValueError, match="Invalid queue format"):
            backend.map_topic(malformed)

    def test_invalid_class_raises(self, backend):
        # Three segments, but the leading class segment is 'unknown'.
        bad_class = 'unknown:tg:topic'
        with pytest.raises(ValueError, match="Invalid queue class"):
            backend.map_topic(bad_class)

    def test_custom_topicspace(self, backend):
        mapped = backend.map_topic('flow:prod:my-queue')
        assert mapped == 'persistent://prod/flow/my-queue'
|
|
|
|
|
|
class TestGetPubsubDispatch:
    """Checks on how ``get_pubsub`` reacts to the backend selector."""

    def test_unknown_backend_raises(self):
        # 'redis' is expected to be rejected with a ValueError.
        unsupported = 'redis'
        with pytest.raises(ValueError, match="Unknown pub/sub backend"):
            get_pubsub(pubsub_backend=unsupported)
|
|
|
|
|
|
class TestAddPubsubArgs:
    """Checks on the Pulsar-related options registered by ``add_pubsub_args``."""

    @staticmethod
    def _parsed(argv=(), **options):
        """Build a fresh parser, register the pub/sub options, parse argv.

        ``options`` is forwarded unchanged to ``add_pubsub_args`` so each
        test controls whether ``standalone`` is passed at all.
        """
        cli = argparse.ArgumentParser()
        add_pubsub_args(cli, **options)
        return cli.parse_args(list(argv))

    def test_standalone_defaults_to_localhost(self):
        ns = self._parsed(standalone=True)
        assert ns.pulsar_host == 'pulsar://localhost:6650'
        assert ns.pulsar_listener == 'localhost'

    def test_non_standalone_defaults_to_container(self):
        ns = self._parsed(standalone=False)
        # Only the host:port fragment is checked, not the full URL.
        assert 'pulsar:6650' in ns.pulsar_host
        assert ns.pulsar_listener is None

    def test_cli_override_respected(self):
        custom_url = 'pulsar://custom:6650'
        ns = self._parsed(['--pulsar-host', custom_url], standalone=True)
        assert ns.pulsar_host == 'pulsar://custom:6650'

    def test_pubsub_backend_default(self):
        # No keyword options: add_pubsub_args is called with the parser only.
        ns = self._parsed()
        assert ns.pubsub_backend == 'pulsar'
|
|
|
|
|
|
class TestAddPubsubArgsRabbitMQ:
    """Checks on the RabbitMQ options registered by ``add_pubsub_args``."""

    @staticmethod
    def _parsed(argv=(), **options):
        """Build a fresh parser, register the pub/sub options, parse argv.

        ``options`` is forwarded unchanged to ``add_pubsub_args``.
        """
        cli = argparse.ArgumentParser()
        add_pubsub_args(cli, **options)
        return cli.parse_args(list(argv))

    def test_rabbitmq_args_present(self):
        argv = [
            '--pubsub-backend', 'rabbitmq',
            '--rabbitmq-host', 'myhost',
            '--rabbitmq-port', '5673',
        ]
        ns = self._parsed(argv)
        assert ns.pubsub_backend == 'rabbitmq'
        assert ns.rabbitmq_host == 'myhost'
        # The port is given as a string on the CLI and compared as an int.
        assert ns.rabbitmq_port == 5673

    def test_rabbitmq_defaults_container(self):
        ns = self._parsed()
        expected_defaults = {
            'rabbitmq_host': 'rabbitmq',
            'rabbitmq_port': 5672,
            'rabbitmq_username': 'guest',
            'rabbitmq_password': 'guest',
            'rabbitmq_vhost': '/',
        }
        for attr, expected in expected_defaults.items():
            assert getattr(ns, attr) == expected

    def test_rabbitmq_standalone_defaults_to_localhost(self):
        ns = self._parsed(standalone=True)
        assert ns.rabbitmq_host == 'localhost'
|
|
|
|
|
|
class TestQueueDefinitions:
    """Check that the queue constants in the schema modules have the expected names."""

    # Each import is done inside its test, so a failure to import one
    # schema module only fails the tests that need it.

    def test_config_request(self):
        from trustgraph.schema.services.config import (
            config_request_queue as actual,
        )
        expected = 'request:tg:config'
        assert actual == expected

    def test_config_response(self):
        from trustgraph.schema.services.config import (
            config_response_queue as actual,
        )
        expected = 'response:tg:config'
        assert actual == expected

    def test_config_push(self):
        from trustgraph.schema.services.config import (
            config_push_queue as actual,
        )
        # The push queue is expected under the 'state' class.
        expected = 'state:tg:config'
        assert actual == expected

    def test_librarian_request(self):
        from trustgraph.schema.services.library import (
            librarian_request_queue as actual,
        )
        expected = 'request:tg:librarian'
        assert actual == expected

    def test_knowledge_request(self):
        from trustgraph.schema.knowledge.knowledge import (
            knowledge_request_queue as actual,
        )
        expected = 'request:tg:knowledge'
        assert actual == expected
|