Release 1.4 -> master (#524)

Catch up
2026-06-15 01:35:13 +02:00 · 2025-09-20 16:00:37 +01:00 · 2025-09-20 16:00:37 +01:00 · 6c7af8789d
commit 6c7af8789d
parent a8e437fc7f
216 changed files with 31360 additions and 1611 deletions
--- a/tests/unit/test_base/test_cassandra_config.py
+++ b/tests/unit/test_base/test_cassandra_config.py
@ -0,0 +1,412 @@
+"""
+Unit tests for Cassandra configuration helper module.
+
+Tests configuration resolution, environment variable handling,
+command-line argument parsing, and backward compatibility.
+"""
+
+import argparse
+import os
+import pytest
+from unittest.mock import patch
+
+from trustgraph.base.cassandra_config import (
+    get_cassandra_defaults,
+    add_cassandra_args,
+    resolve_cassandra_config,
+    get_cassandra_config_from_params
+)
+
+
+class TestGetCassandraDefaults:
+    """Test the get_cassandra_defaults function."""
+    
+    def test_defaults_with_no_env_vars(self):
+        """Test defaults when no environment variables are set."""
+        with patch.dict(os.environ, {}, clear=True):
+            defaults = get_cassandra_defaults()
+            
+            assert defaults['host'] == 'cassandra'
+            assert defaults['username'] is None
+            assert defaults['password'] is None
+    
+    def test_defaults_with_env_vars(self):
+        """Test defaults when environment variables are set."""
+        env_vars = {
+            'CASSANDRA_HOST': 'env-host1,env-host2',
+            'CASSANDRA_USERNAME': 'env-user',
+            'CASSANDRA_PASSWORD': 'env-pass'
+        }
+        
+        with patch.dict(os.environ, env_vars, clear=True):
+            defaults = get_cassandra_defaults()
+            
+            assert defaults['host'] == 'env-host1,env-host2'
+            assert defaults['username'] == 'env-user'
+            assert defaults['password'] == 'env-pass'
+    
+    def test_partial_env_vars(self):
+        """Test defaults when only some environment variables are set."""
+        env_vars = {
+            'CASSANDRA_HOST': 'partial-host',
+            'CASSANDRA_USERNAME': 'partial-user'
+            # CASSANDRA_PASSWORD not set
+        }
+        
+        with patch.dict(os.environ, env_vars, clear=True):
+            defaults = get_cassandra_defaults()
+            
+            assert defaults['host'] == 'partial-host'
+            assert defaults['username'] == 'partial-user'
+            assert defaults['password'] is None
+
+
+class TestAddCassandraArgs:
+    """Test the add_cassandra_args function."""
+    
+    def test_basic_args_added(self):
+        """Test that all three arguments are added to parser."""
+        parser = argparse.ArgumentParser()
+        add_cassandra_args(parser)
+        
+        # Parse empty args to check defaults
+        args = parser.parse_args([])
+        
+        assert hasattr(args, 'cassandra_host')
+        assert hasattr(args, 'cassandra_username')
+        assert hasattr(args, 'cassandra_password')
+    
+    def test_help_text_no_env_vars(self):
+        """Test help text when no environment variables are set."""
+        with patch.dict(os.environ, {}, clear=True):
+            parser = argparse.ArgumentParser()
+            add_cassandra_args(parser)
+            
+            help_text = parser.format_help()
+            
+            assert 'Cassandra host list, comma-separated (default:' in help_text
+            assert 'cassandra)' in help_text
+            assert 'Cassandra username' in help_text
+            assert 'Cassandra password' in help_text
+            assert '[from CASSANDRA_HOST]' not in help_text
+    
+    def test_help_text_with_env_vars(self):
+        """Test help text when environment variables are set."""
+        env_vars = {
+            'CASSANDRA_HOST': 'help-host1,help-host2',
+            'CASSANDRA_USERNAME': 'help-user',
+            'CASSANDRA_PASSWORD': 'help-pass'
+        }
+        
+        with patch.dict(os.environ, env_vars, clear=True):
+            parser = argparse.ArgumentParser()
+            add_cassandra_args(parser)
+            
+            help_text = parser.format_help()
+            
+            # Help text may have line breaks - argparse breaks long lines
+            # So check for the components that should be there
+            assert 'help-' in help_text and 'host1' in help_text
+            assert 'help-host2' in help_text
+            # Check key components (may be split across lines by argparse)
+            assert '[from CASSANDRA_HOST]' in help_text
+            assert '(default: help-user)' in help_text
+            assert '[from' in help_text and 'CASSANDRA_USERNAME]' in help_text
+            assert '(default: <set>)' in help_text  # Password hidden
+            assert '[from' in help_text and 'CASSANDRA_PASSWORD]' in help_text
+            assert 'help-pass' not in help_text  # Password value not shown
+    
+    def test_command_line_override(self):
+        """Test that command-line arguments override environment variables."""
+        env_vars = {
+            'CASSANDRA_HOST': 'env-host',
+            'CASSANDRA_USERNAME': 'env-user',
+            'CASSANDRA_PASSWORD': 'env-pass'
+        }
+        
+        with patch.dict(os.environ, env_vars, clear=True):
+            parser = argparse.ArgumentParser()
+            add_cassandra_args(parser)
+            
+            args = parser.parse_args([
+                '--cassandra-host', 'cli-host',
+                '--cassandra-username', 'cli-user',
+                '--cassandra-password', 'cli-pass'
+            ])
+            
+            assert args.cassandra_host == 'cli-host'
+            assert args.cassandra_username == 'cli-user'
+            assert args.cassandra_password == 'cli-pass'
+
+
+class TestResolveCassandraConfig:
+    """Test the resolve_cassandra_config function."""
+    
+    def test_default_configuration(self):
+        """Test resolution with no parameters or environment variables."""
+        with patch.dict(os.environ, {}, clear=True):
+            hosts, username, password = resolve_cassandra_config()
+            
+            assert hosts == ['cassandra']
+            assert username is None
+            assert password is None
+    
+    def test_environment_variable_resolution(self):
+        """Test resolution from environment variables."""
+        env_vars = {
+            'CASSANDRA_HOST': 'env1,env2,env3',
+            'CASSANDRA_USERNAME': 'env-user',
+            'CASSANDRA_PASSWORD': 'env-pass'
+        }
+        
+        with patch.dict(os.environ, env_vars, clear=True):
+            hosts, username, password = resolve_cassandra_config()
+            
+            assert hosts == ['env1', 'env2', 'env3']
+            assert username == 'env-user'
+            assert password == 'env-pass'
+    
+    def test_explicit_parameter_override(self):
+        """Test that explicit parameters override environment variables."""
+        env_vars = {
+            'CASSANDRA_HOST': 'env-host',
+            'CASSANDRA_USERNAME': 'env-user',
+            'CASSANDRA_PASSWORD': 'env-pass'
+        }
+        
+        with patch.dict(os.environ, env_vars, clear=True):
+            hosts, username, password = resolve_cassandra_config(
+                host='explicit-host',
+                username='explicit-user',
+                password='explicit-pass'
+            )
+            
+            assert hosts == ['explicit-host']
+            assert username == 'explicit-user'
+            assert password == 'explicit-pass'
+    
+    def test_host_list_parsing(self):
+        """Test different host list formats."""
+        # Single host
+        hosts, _, _ = resolve_cassandra_config(host='single-host')
+        assert hosts == ['single-host']
+        
+        # Multiple hosts with spaces
+        hosts, _, _ = resolve_cassandra_config(host='host1, host2 ,host3')
+        assert hosts == ['host1', 'host2', 'host3']
+        
+        # Empty elements filtered out
+        hosts, _, _ = resolve_cassandra_config(host='host1,,host2,')
+        assert hosts == ['host1', 'host2']
+        
+        # Already a list
+        hosts, _, _ = resolve_cassandra_config(host=['list-host1', 'list-host2'])
+        assert hosts == ['list-host1', 'list-host2']
+    
+    def test_args_object_resolution(self):
+        """Test resolution from argparse args object."""
+        # Mock args object
+        class MockArgs:
+            cassandra_host = 'args-host1,args-host2'
+            cassandra_username = 'args-user'
+            cassandra_password = 'args-pass'
+        
+        args = MockArgs()
+        hosts, username, password = resolve_cassandra_config(args)
+        
+        assert hosts == ['args-host1', 'args-host2']
+        assert username == 'args-user'
+        assert password == 'args-pass'
+    
+    def test_partial_args_with_env_fallback(self):
+        """Test args object with missing attributes falls back to environment."""
+        env_vars = {
+            'CASSANDRA_HOST': 'env-host',
+            'CASSANDRA_USERNAME': 'env-user',
+            'CASSANDRA_PASSWORD': 'env-pass'
+        }
+        
+        # Args object with only some attributes
+        class PartialArgs:
+            cassandra_host = 'args-host'
+            # Missing cassandra_username and cassandra_password
+        
+        with patch.dict(os.environ, env_vars, clear=True):
+            args = PartialArgs()
+            hosts, username, password = resolve_cassandra_config(args)
+            
+            assert hosts == ['args-host']  # From args
+            assert username == 'env-user'  # From env
+            assert password == 'env-pass'  # From env
+
+
+class TestGetCassandraConfigFromParams:
+    """Test the get_cassandra_config_from_params function."""
+    
+    def test_new_parameter_names(self):
+        """Test with new cassandra_* parameter names."""
+        params = {
+            'cassandra_host': 'new-host1,new-host2',
+            'cassandra_username': 'new-user',
+            'cassandra_password': 'new-pass'
+        }
+        
+        hosts, username, password = get_cassandra_config_from_params(params)
+        
+        assert hosts == ['new-host1', 'new-host2']
+        assert username == 'new-user'
+        assert password == 'new-pass'
+    
+    def test_no_backward_compatibility_graph_params(self):
+        """Test that old graph_* parameter names are no longer supported."""
+        params = {
+            'graph_host': 'old-host',
+            'graph_username': 'old-user',
+            'graph_password': 'old-pass'
+        }
+        
+        hosts, username, password = get_cassandra_config_from_params(params)
+        
+        # Should use defaults since graph_* params are not recognized
+        assert hosts == ['cassandra']  # Default
+        assert username is None
+        assert password is None
+    
+    def test_no_old_cassandra_user_compatibility(self):
+        """Test that cassandra_user is no longer supported (must be cassandra_username)."""
+        params = {
+            'cassandra_host': 'compat-host',
+            'cassandra_user': 'compat-user',  # Old name - not supported
+            'cassandra_password': 'compat-pass'
+        }
+        
+        hosts, username, password = get_cassandra_config_from_params(params)
+        
+        assert hosts == ['compat-host']
+        assert username is None  # cassandra_user is not recognized
+        assert password == 'compat-pass'
+    
+    def test_only_new_parameters_work(self):
+        """Test that only new parameter names are recognized."""
+        params = {
+            'cassandra_host': 'new-host',
+            'graph_host': 'old-host',
+            'cassandra_username': 'new-user',
+            'graph_username': 'old-user',
+            'cassandra_user': 'older-user',
+            'cassandra_password': 'new-pass',
+            'graph_password': 'old-pass'
+        }
+        
+        hosts, username, password = get_cassandra_config_from_params(params)
+        
+        assert hosts == ['new-host']  # Only cassandra_* params work
+        assert username == 'new-user'  # Only cassandra_* params work
+        assert password == 'new-pass'  # Only cassandra_* params work
+    
+    def test_empty_params_with_env_fallback(self):
+        """Test that empty params falls back to environment variables."""
+        env_vars = {
+            'CASSANDRA_HOST': 'fallback-host1,fallback-host2',
+            'CASSANDRA_USERNAME': 'fallback-user',
+            'CASSANDRA_PASSWORD': 'fallback-pass'
+        }
+        
+        with patch.dict(os.environ, env_vars, clear=True):
+            params = {}
+            hosts, username, password = get_cassandra_config_from_params(params)
+            
+            assert hosts == ['fallback-host1', 'fallback-host2']
+            assert username == 'fallback-user'
+            assert password == 'fallback-pass'
+
+
+class TestConfigurationPriority:
+    """Test the overall configuration priority: CLI > env vars > defaults."""
+    
+    def test_full_priority_chain(self):
+        """Test complete priority chain with all sources present."""
+        env_vars = {
+            'CASSANDRA_HOST': 'env-host',
+            'CASSANDRA_USERNAME': 'env-user',
+            'CASSANDRA_PASSWORD': 'env-pass'
+        }
+        
+        with patch.dict(os.environ, env_vars, clear=True):
+            # CLI args should override everything
+            hosts, username, password = resolve_cassandra_config(
+                host='cli-host',
+                username='cli-user',
+                password='cli-pass'
+            )
+            
+            assert hosts == ['cli-host']
+            assert username == 'cli-user'
+            assert password == 'cli-pass'
+    
+    def test_partial_cli_with_env_fallback(self):
+        """Test partial CLI args with environment variable fallback."""
+        env_vars = {
+            'CASSANDRA_HOST': 'env-host',
+            'CASSANDRA_USERNAME': 'env-user',
+            'CASSANDRA_PASSWORD': 'env-pass'
+        }
+        
+        with patch.dict(os.environ, env_vars, clear=True):
+            # Only provide host via CLI
+            hosts, username, password = resolve_cassandra_config(
+                host='cli-host'
+                # username and password not provided
+            )
+            
+            assert hosts == ['cli-host']      # From CLI
+            assert username == 'env-user'    # From env
+            assert password == 'env-pass'    # From env
+    
+    def test_no_config_defaults(self):
+        """Test that defaults are used when no configuration is provided."""
+        with patch.dict(os.environ, {}, clear=True):
+            hosts, username, password = resolve_cassandra_config()
+            
+            assert hosts == ['cassandra']  # Default
+            assert username is None       # Default
+            assert password is None       # Default
+
+
+class TestEdgeCases:
+    """Test edge cases and error conditions."""
+    
+    def test_empty_host_string(self):
+        """Test handling of empty host string falls back to default."""
+        hosts, _, _ = resolve_cassandra_config(host='')
+        assert hosts == ['cassandra']  # Falls back to default
+    
+    def test_whitespace_only_host(self):
+        """Test handling of whitespace-only host string."""
+        hosts, _, _ = resolve_cassandra_config(host='   ')
+        assert hosts == []  # Empty after stripping whitespace
+    
+    def test_none_values_preserved(self):
+        """Test that None values are preserved correctly."""
+        hosts, username, password = resolve_cassandra_config(
+            host=None,
+            username=None,
+            password=None
+        )
+        
+        # Should fall back to defaults
+        assert hosts == ['cassandra']
+        assert username is None
+        assert password is None
+    
+    def test_mixed_none_and_values(self):
+        """Test mixing None and actual values."""
+        hosts, username, password = resolve_cassandra_config(
+            host='mixed-host',
+            username=None,
+            password='mixed-pass'
+        )
+        
+        assert hosts == ['mixed-host']
+        assert username is None  # Stays None
+        assert password == 'mixed-pass'
--- a/tests/unit/test_base/test_document_embeddings_client.py
+++ b/tests/unit/test_base/test_document_embeddings_client.py
@ -0,0 +1,190 @@
+"""
+Unit tests for trustgraph.base.document_embeddings_client
+Testing async document embeddings client functionality
+"""
+
+import pytest
+from unittest.mock import AsyncMock, MagicMock, patch
+from unittest import IsolatedAsyncioTestCase
+
+from trustgraph.base.document_embeddings_client import DocumentEmbeddingsClient, DocumentEmbeddingsClientSpec
+from trustgraph.schema import DocumentEmbeddingsRequest, DocumentEmbeddingsResponse, Error
+
+
+class TestDocumentEmbeddingsClient(IsolatedAsyncioTestCase):
+    """Test async document embeddings client functionality"""
+
+    @patch('trustgraph.base.request_response_spec.RequestResponse.__init__')
+    async def test_query_success_with_chunks(self, mock_parent_init):
+        """Test successful query returning chunks"""
+        # Arrange
+        mock_parent_init.return_value = None
+        client = DocumentEmbeddingsClient()
+        mock_response = MagicMock(spec=DocumentEmbeddingsResponse)
+        mock_response.error = None
+        mock_response.chunks = ["chunk1", "chunk2", "chunk3"]
+        
+        # Mock the request method
+        client.request = AsyncMock(return_value=mock_response)
+        
+        vectors = [[0.1, 0.2, 0.3], [0.4, 0.5, 0.6]]
+        
+        # Act
+        result = await client.query(
+            vectors=vectors,
+            limit=10,
+            user="test_user",
+            collection="test_collection",
+            timeout=30
+        )
+        
+        # Assert
+        assert result == ["chunk1", "chunk2", "chunk3"]
+        client.request.assert_called_once()
+        call_args = client.request.call_args[0][0]
+        assert isinstance(call_args, DocumentEmbeddingsRequest)
+        assert call_args.vectors == vectors
+        assert call_args.limit == 10
+        assert call_args.user == "test_user"
+        assert call_args.collection == "test_collection"
+
+    @patch('trustgraph.base.request_response_spec.RequestResponse.__init__')
+    async def test_query_with_error_raises_exception(self, mock_parent_init):
+        """Test query raises RuntimeError when response contains error"""
+        # Arrange
+        mock_parent_init.return_value = None
+        client = DocumentEmbeddingsClient()
+        mock_response = MagicMock(spec=DocumentEmbeddingsResponse)
+        mock_response.error = MagicMock()
+        mock_response.error.message = "Database connection failed"
+        
+        client.request = AsyncMock(return_value=mock_response)
+        
+        # Act & Assert
+        with pytest.raises(RuntimeError, match="Database connection failed"):
+            await client.query(
+                vectors=[[0.1, 0.2, 0.3]],
+                limit=5
+            )
+
+    @patch('trustgraph.base.request_response_spec.RequestResponse.__init__')
+    async def test_query_with_empty_chunks(self, mock_parent_init):
+        """Test query with empty chunks list"""
+        # Arrange
+        mock_parent_init.return_value = None
+        client = DocumentEmbeddingsClient()
+        mock_response = MagicMock(spec=DocumentEmbeddingsResponse)
+        mock_response.error = None
+        mock_response.chunks = []
+        
+        client.request = AsyncMock(return_value=mock_response)
+        
+        # Act
+        result = await client.query(vectors=[[0.1, 0.2, 0.3]])
+        
+        # Assert
+        assert result == []
+
+    @patch('trustgraph.base.request_response_spec.RequestResponse.__init__')
+    async def test_query_with_default_parameters(self, mock_parent_init):
+        """Test query uses correct default parameters"""
+        # Arrange
+        mock_parent_init.return_value = None
+        client = DocumentEmbeddingsClient()
+        mock_response = MagicMock(spec=DocumentEmbeddingsResponse)
+        mock_response.error = None
+        mock_response.chunks = ["test_chunk"]
+        
+        client.request = AsyncMock(return_value=mock_response)
+        
+        # Act
+        result = await client.query(vectors=[[0.1, 0.2, 0.3]])
+        
+        # Assert
+        client.request.assert_called_once()
+        call_args = client.request.call_args[0][0]
+        assert call_args.limit == 20  # Default limit
+        assert call_args.user == "trustgraph"  # Default user
+        assert call_args.collection == "default"  # Default collection
+
+    @patch('trustgraph.base.request_response_spec.RequestResponse.__init__')
+    async def test_query_with_custom_timeout(self, mock_parent_init):
+        """Test query passes custom timeout to request"""
+        # Arrange
+        mock_parent_init.return_value = None
+        client = DocumentEmbeddingsClient()
+        mock_response = MagicMock(spec=DocumentEmbeddingsResponse)
+        mock_response.error = None
+        mock_response.chunks = ["chunk1"]
+        
+        client.request = AsyncMock(return_value=mock_response)
+        
+        # Act
+        await client.query(
+            vectors=[[0.1, 0.2, 0.3]],
+            timeout=60
+        )
+        
+        # Assert
+        assert client.request.call_args[1]["timeout"] == 60
+
+    @patch('trustgraph.base.request_response_spec.RequestResponse.__init__')
+    async def test_query_logging(self, mock_parent_init):
+        """Test query logs response for debugging"""
+        # Arrange
+        mock_parent_init.return_value = None
+        client = DocumentEmbeddingsClient()
+        mock_response = MagicMock(spec=DocumentEmbeddingsResponse)
+        mock_response.error = None
+        mock_response.chunks = ["test_chunk"]
+        
+        client.request = AsyncMock(return_value=mock_response)
+        
+        # Act
+        with patch('trustgraph.base.document_embeddings_client.logger') as mock_logger:
+            result = await client.query(vectors=[[0.1, 0.2, 0.3]])
+            
+            # Assert
+            mock_logger.debug.assert_called_once()
+            assert "Document embeddings response" in str(mock_logger.debug.call_args)
+            assert result == ["test_chunk"]
+
+
+class TestDocumentEmbeddingsClientSpec(IsolatedAsyncioTestCase):
+    """Test DocumentEmbeddingsClientSpec configuration"""
+
+    def test_spec_initialization(self):
+        """Test DocumentEmbeddingsClientSpec initialization"""
+        # Act
+        spec = DocumentEmbeddingsClientSpec(
+            request_name="test-request",
+            response_name="test-response"
+        )
+        
+        # Assert
+        assert spec.request_name == "test-request"
+        assert spec.response_name == "test-response"
+        assert spec.request_schema == DocumentEmbeddingsRequest
+        assert spec.response_schema == DocumentEmbeddingsResponse
+        assert spec.impl == DocumentEmbeddingsClient
+
+    @patch('trustgraph.base.request_response_spec.RequestResponseSpec.__init__')
+    def test_spec_calls_parent_init(self, mock_parent_init):
+        """Test spec properly calls parent class initialization"""
+        # Arrange
+        mock_parent_init.return_value = None
+        
+        # Act
+        spec = DocumentEmbeddingsClientSpec(
+            request_name="test-request",
+            response_name="test-response"
+        )
+        
+        # Assert
+        mock_parent_init.assert_called_once_with(
+            request_name="test-request",
+            request_schema=DocumentEmbeddingsRequest,
+            response_name="test-response",
+            response_schema=DocumentEmbeddingsResponse,
+            impl=DocumentEmbeddingsClient
+        )
--- a/tests/unit/test_base/test_publisher_graceful_shutdown.py
+++ b/tests/unit/test_base/test_publisher_graceful_shutdown.py
@ -0,0 +1,330 @@
+"""Unit tests for Publisher graceful shutdown functionality."""
+
+import pytest
+import asyncio
+import time
+from unittest.mock import AsyncMock, MagicMock, patch
+from trustgraph.base.publisher import Publisher
+
+
+@pytest.fixture
+def mock_pulsar_client():
+    """Mock Pulsar client for testing."""
+    client = MagicMock()
+    producer = AsyncMock()
+    producer.send = MagicMock()
+    producer.flush = MagicMock()
+    producer.close = MagicMock()
+    client.create_producer.return_value = producer
+    return client
+
+
+@pytest.fixture
+def publisher(mock_pulsar_client):
+    """Create Publisher instance for testing."""
+    return Publisher(
+        client=mock_pulsar_client,
+        topic="test-topic",
+        schema=dict,
+        max_size=10,
+        drain_timeout=2.0
+    )
+
+
+@pytest.mark.asyncio
+async def test_publisher_queue_drain():
+    """Verify Publisher drains queue on shutdown."""
+    mock_client = MagicMock()
+    mock_producer = MagicMock()
+    mock_client.create_producer.return_value = mock_producer
+    
+    publisher = Publisher(
+        client=mock_client,
+        topic="test-topic", 
+        schema=dict,
+        max_size=10,
+        drain_timeout=1.0  # Shorter timeout for testing
+    )
+    
+    # Don't start the actual run loop - just test the drain logic
+    # Fill queue with messages directly
+    for i in range(5):
+        await publisher.q.put((f"id-{i}", {"data": i}))
+    
+    # Verify queue has messages
+    assert not publisher.q.empty()
+    
+    # Mock the producer creation in run() method by patching
+    with patch.object(publisher, 'run') as mock_run:
+        # Create a realistic run implementation that processes the queue
+        async def mock_run_impl():
+            # Simulate the actual run logic for drain
+            producer = mock_producer
+            while not publisher.q.empty():
+                try:
+                    id, item = await asyncio.wait_for(publisher.q.get(), timeout=0.1)
+                    producer.send(item, {"id": id})
+                except asyncio.TimeoutError:
+                    break
+            producer.flush()
+            producer.close()
+        
+        mock_run.side_effect = mock_run_impl
+        
+        # Start and stop publisher
+        await publisher.start()
+        await publisher.stop()
+    
+    # Verify all messages were sent
+    assert publisher.q.empty()
+    assert mock_producer.send.call_count == 5
+    mock_producer.flush.assert_called_once()
+    mock_producer.close.assert_called_once()
+
+
+@pytest.mark.asyncio
+async def test_publisher_rejects_messages_during_drain():
+    """Verify Publisher rejects new messages during shutdown."""
+    mock_client = MagicMock()
+    mock_producer = MagicMock()
+    mock_client.create_producer.return_value = mock_producer
+    
+    publisher = Publisher(
+        client=mock_client,
+        topic="test-topic",
+        schema=dict,
+        max_size=10,
+        drain_timeout=1.0
+    )
+    
+    # Don't start the actual run loop
+    # Add one message directly
+    await publisher.q.put(("id-1", {"data": 1}))
+    
+    # Start shutdown process manually
+    publisher.running = False
+    publisher.draining = True
+    
+    # Try to send message during drain
+    with pytest.raises(RuntimeError, match="Publisher is shutting down"):
+        await publisher.send("id-2", {"data": 2})
+
+
+@pytest.mark.asyncio
+async def test_publisher_drain_timeout():
+    """Verify Publisher respects drain timeout."""
+    mock_client = MagicMock()
+    mock_producer = MagicMock()
+    mock_client.create_producer.return_value = mock_producer
+    
+    publisher = Publisher(
+        client=mock_client,
+        topic="test-topic",
+        schema=dict,
+        max_size=10,
+        drain_timeout=0.2  # Short timeout for testing
+    )
+    
+    # Fill queue with many messages directly
+    for i in range(10):
+        await publisher.q.put((f"id-{i}", {"data": i}))
+    
+    # Mock slow message processing
+    def slow_send(*args, **kwargs):
+        time.sleep(0.1)  # Simulate slow send
+    
+    mock_producer.send.side_effect = slow_send
+    
+    with patch.object(publisher, 'run') as mock_run:
+        # Create a run implementation that respects timeout
+        async def mock_run_with_timeout():
+            producer = mock_producer
+            end_time = time.time() + publisher.drain_timeout
+            
+            while not publisher.q.empty() and time.time() < end_time:
+                try:
+                    id, item = await asyncio.wait_for(publisher.q.get(), timeout=0.05)
+                    producer.send(item, {"id": id})
+                except asyncio.TimeoutError:
+                    break
+            
+            producer.flush()
+            producer.close()
+        
+        mock_run.side_effect = mock_run_with_timeout
+        
+        start_time = time.time()
+        await publisher.start()
+        await publisher.stop()
+        end_time = time.time()
+    
+    # Should timeout quickly
+    assert end_time - start_time < 1.0
+    
+    # Should have called flush and close even with timeout
+    mock_producer.flush.assert_called_once()
+    mock_producer.close.assert_called_once()
+
+
+@pytest.mark.asyncio
+async def test_publisher_successful_drain():
+    """Verify Publisher drains successfully under normal conditions."""
+    mock_client = MagicMock()
+    mock_producer = MagicMock()
+    mock_client.create_producer.return_value = mock_producer
+    
+    publisher = Publisher(
+        client=mock_client,
+        topic="test-topic",
+        schema=dict,
+        max_size=10,
+        drain_timeout=2.0
+    )
+    
+    # Add messages directly to queue
+    messages = []
+    for i in range(3):
+        msg = {"data": i}
+        await publisher.q.put((f"id-{i}", msg))
+        messages.append(msg)
+    
+    with patch.object(publisher, 'run') as mock_run:
+        # Create a successful drain implementation
+        async def mock_successful_drain():
+            producer = mock_producer
+            processed = []
+            
+            while not publisher.q.empty():
+                id, item = await publisher.q.get()
+                producer.send(item, {"id": id})
+                processed.append((id, item))
+            
+            producer.flush()
+            producer.close()
+            return processed
+        
+        mock_run.side_effect = mock_successful_drain
+        
+        await publisher.start()
+        await publisher.stop()
+    
+    # All messages should be sent
+    assert publisher.q.empty()
+    assert mock_producer.send.call_count == 3
+    
+    # Verify correct messages were sent
+    sent_calls = mock_producer.send.call_args_list
+    for i, call in enumerate(sent_calls):
+        args, kwargs = call
+        assert args[0] == {"data": i}  # message content
+        # Note: kwargs format depends on how send was called in mock
+        # Just verify message was sent with correct content
+
+
+@pytest.mark.asyncio
+async def test_publisher_state_transitions():
+    """Test Publisher state transitions during graceful shutdown."""
+    mock_client = MagicMock()
+    mock_producer = MagicMock()
+    mock_client.create_producer.return_value = mock_producer
+    
+    publisher = Publisher(
+        client=mock_client,
+        topic="test-topic",
+        schema=dict,
+        max_size=10,
+        drain_timeout=1.0
+    )
+    
+    # Initial state
+    assert publisher.running is True
+    assert publisher.draining is False
+    
+    # Add message directly
+    await publisher.q.put(("id-1", {"data": 1}))
+    
+    with patch.object(publisher, 'run') as mock_run:
+        # Mock run that simulates state transitions
+        async def mock_run_with_states():
+            # Simulate drain process
+            publisher.running = False
+            publisher.draining = True
+            
+            # Process messages
+            while not publisher.q.empty():
+                id, item = await publisher.q.get()
+                mock_producer.send(item, {"id": id})
+            
+            # Complete drain
+            publisher.draining = False
+            mock_producer.flush()
+            mock_producer.close()
+        
+        mock_run.side_effect = mock_run_with_states
+        
+        await publisher.start()
+        await publisher.stop()
+    
+    # Should have completed all state transitions
+    assert publisher.running is False
+    assert publisher.draining is False
+    mock_producer.send.assert_called_once()
+    mock_producer.flush.assert_called_once()
+    mock_producer.close.assert_called_once()
+
+
+@pytest.mark.asyncio
+async def test_publisher_exception_handling():
+    """Test Publisher handles exceptions during drain gracefully."""
+    mock_client = MagicMock()
+    mock_producer = MagicMock()
+    mock_client.create_producer.return_value = mock_producer
+    
+    # Mock producer.send to raise exception on second call
+    call_count = 0
+    def failing_send(*args, **kwargs):
+        nonlocal call_count
+        call_count += 1
+        if call_count == 2:
+            raise Exception("Send failed")
+    
+    mock_producer.send.side_effect = failing_send
+    
+    publisher = Publisher(
+        client=mock_client,
+        topic="test-topic",
+        schema=dict,
+        max_size=10,
+        drain_timeout=1.0
+    )
+    
+    # Add messages directly
+    await publisher.q.put(("id-1", {"data": 1}))
+    await publisher.q.put(("id-2", {"data": 2}))
+    
+    with patch.object(publisher, 'run') as mock_run:
+        # Mock run that handles exceptions gracefully
+        async def mock_run_with_exceptions():
+            producer = mock_producer
+            
+            while not publisher.q.empty():
+                try:
+                    id, item = await publisher.q.get()
+                    producer.send(item, {"id": id})
+                except Exception as e:
+                    # Log exception but continue processing
+                    continue
+            
+            # Always call flush and close
+            producer.flush()
+            producer.close()
+        
+        mock_run.side_effect = mock_run_with_exceptions
+        
+        await publisher.start()
+        await publisher.stop()
+    
+    # Should have attempted to send both messages
+    assert mock_producer.send.call_count == 2
+    mock_producer.flush.assert_called_once()
+    mock_producer.close.assert_called_once()
--- a/tests/unit/test_base/test_subscriber_graceful_shutdown.py
+++ b/tests/unit/test_base/test_subscriber_graceful_shutdown.py
@ -0,0 +1,382 @@
+"""Unit tests for Subscriber graceful shutdown functionality."""
+
+import pytest
+import asyncio
+import uuid
+from unittest.mock import AsyncMock, MagicMock, patch
+from trustgraph.base.subscriber import Subscriber
+
+# Mock JsonSchema globally to avoid schema issues in tests  
+# Patch at the module level where it's imported in subscriber
+@patch('trustgraph.base.subscriber.JsonSchema')
+def mock_json_schema_global(mock_schema):
+    mock_schema.return_value = MagicMock()
+    return mock_schema
+
+# Apply the global patch
+_json_schema_patch = patch('trustgraph.base.subscriber.JsonSchema')
+_mock_json_schema = _json_schema_patch.start()
+_mock_json_schema.return_value = MagicMock()
+
+
+@pytest.fixture
+def mock_pulsar_client():
+    """Mock Pulsar client for testing."""
+    client = MagicMock()
+    consumer = MagicMock()
+    consumer.receive = MagicMock()
+    consumer.acknowledge = MagicMock()
+    consumer.negative_acknowledge = MagicMock()
+    consumer.pause_message_listener = MagicMock()
+    consumer.unsubscribe = MagicMock()
+    consumer.close = MagicMock()
+    client.subscribe.return_value = consumer
+    return client
+
+
+@pytest.fixture
+def subscriber(mock_pulsar_client):
+    """Create Subscriber instance for testing."""
+    return Subscriber(
+        client=mock_pulsar_client,
+        topic="test-topic",
+        subscription="test-subscription",
+        consumer_name="test-consumer",
+        schema=dict,
+        max_size=10,
+        drain_timeout=2.0,
+        backpressure_strategy="block"
+    )
+
+
+def create_mock_message(message_id="test-id", data=None):
+    """Create a mock Pulsar message."""
+    msg = MagicMock()
+    msg.properties.return_value = {"id": message_id}
+    msg.value.return_value = data or {"test": "data"}
+    return msg
+
+
+@pytest.mark.asyncio
+async def test_subscriber_deferred_acknowledgment_success():
+    """Verify Subscriber only acks on successful delivery."""
+    mock_client = MagicMock()
+    mock_consumer = MagicMock()
+    mock_client.subscribe.return_value = mock_consumer
+    
+    subscriber = Subscriber(
+        client=mock_client,
+        topic="test-topic",
+        subscription="test-subscription", 
+        consumer_name="test-consumer",
+        schema=dict,
+        max_size=10,
+        backpressure_strategy="block"
+    )
+    
+    # Start subscriber to initialize consumer
+    await subscriber.start()
+    
+    # Create queue for subscription
+    queue = await subscriber.subscribe("test-queue")
+    
+    # Create mock message with matching queue name
+    msg = create_mock_message("test-queue", {"data": "test"})
+    
+    # Process message
+    await subscriber._process_message(msg)
+    
+    # Should acknowledge successful delivery
+    mock_consumer.acknowledge.assert_called_once_with(msg)
+    mock_consumer.negative_acknowledge.assert_not_called()
+    
+    # Message should be in queue
+    assert not queue.empty()
+    received_msg = await queue.get()
+    assert received_msg == {"data": "test"}
+    
+    # Clean up
+    await subscriber.stop()
+
+
+@pytest.mark.asyncio
+async def test_subscriber_deferred_acknowledgment_failure():
+    """Verify Subscriber negative acks on delivery failure."""
+    mock_client = MagicMock()
+    mock_consumer = MagicMock()
+    mock_client.subscribe.return_value = mock_consumer
+    
+    subscriber = Subscriber(
+        client=mock_client,
+        topic="test-topic",
+        subscription="test-subscription",
+        consumer_name="test-consumer", 
+        schema=dict,
+        max_size=1,  # Very small queue
+        backpressure_strategy="drop_new"
+    )
+    
+    # Start subscriber to initialize consumer
+    await subscriber.start()
+    
+    # Create queue and fill it
+    queue = await subscriber.subscribe("test-queue")
+    await queue.put({"existing": "data"})
+    
+    # Create mock message - should be dropped
+    msg = create_mock_message("msg-1", {"data": "test"})
+    
+    # Process message (should fail due to full queue + drop_new strategy)
+    await subscriber._process_message(msg)
+    
+    # Should negative acknowledge failed delivery
+    mock_consumer.negative_acknowledge.assert_called_once_with(msg)
+    mock_consumer.acknowledge.assert_not_called()
+    
+    # Clean up
+    await subscriber.stop()
+
+
+@pytest.mark.asyncio
+async def test_subscriber_backpressure_strategies():
+    """Test different backpressure strategies."""
+    mock_client = MagicMock()
+    mock_consumer = MagicMock()
+    mock_client.subscribe.return_value = mock_consumer
+    
+    # Test drop_oldest strategy
+    subscriber = Subscriber(
+        client=mock_client,
+        topic="test-topic", 
+        subscription="test-subscription",
+        consumer_name="test-consumer",
+        schema=dict,
+        max_size=2,
+        backpressure_strategy="drop_oldest"
+    )
+    
+    # Start subscriber to initialize consumer
+    await subscriber.start()
+    
+    queue = await subscriber.subscribe("test-queue")
+    
+    # Fill queue
+    await queue.put({"data": "old1"})
+    await queue.put({"data": "old2"})
+    
+    # Add new message (should drop oldest) - use matching queue name
+    msg = create_mock_message("test-queue", {"data": "new"})
+    await subscriber._process_message(msg)
+    
+    # Should acknowledge delivery
+    mock_consumer.acknowledge.assert_called_once_with(msg)
+    
+    # Queue should have new message (old one dropped)
+    messages = []
+    while not queue.empty():
+        messages.append(await queue.get())
+    
+    # Should contain old2 and new (old1 was dropped)
+    assert len(messages) == 2
+    assert {"data": "new"} in messages
+    
+    # Clean up
+    await subscriber.stop()
+
+
+@pytest.mark.asyncio
+async def test_subscriber_graceful_shutdown():
+    """Test Subscriber graceful shutdown with queue draining."""
+    mock_client = MagicMock()
+    mock_consumer = MagicMock()
+    mock_client.subscribe.return_value = mock_consumer
+    
+    subscriber = Subscriber(
+        client=mock_client,
+        topic="test-topic",
+        subscription="test-subscription",
+        consumer_name="test-consumer",
+        schema=dict,
+        max_size=10,
+        drain_timeout=1.0
+    )
+    
+    # Create subscription with messages before starting
+    queue = await subscriber.subscribe("test-queue")
+    await queue.put({"data": "msg1"})
+    await queue.put({"data": "msg2"})
+    
+    with patch.object(subscriber, 'run') as mock_run:
+        # Mock run that simulates graceful shutdown
+        async def mock_run_graceful():
+            # Process messages while running, then drain
+            while subscriber.running or subscriber.draining:
+                if subscriber.draining:
+                    # Simulate pause message listener
+                    mock_consumer.pause_message_listener()
+                    # Drain messages
+                    while not queue.empty():
+                        await queue.get()
+                    break
+                await asyncio.sleep(0.05)
+            
+            # Cleanup
+            mock_consumer.unsubscribe()
+            mock_consumer.close()
+        
+        mock_run.side_effect = mock_run_graceful
+        
+        await subscriber.start()
+        
+        # Initial state
+        assert subscriber.running is True
+        assert subscriber.draining is False
+        
+        # Start shutdown
+        stop_task = asyncio.create_task(subscriber.stop())
+        
+        # Allow brief processing
+        await asyncio.sleep(0.1)
+        
+        # Should be in drain state
+        assert subscriber.running is False
+        assert subscriber.draining is True
+        
+        # Complete shutdown
+        await stop_task
+        
+        # Should have cleaned up
+        mock_consumer.unsubscribe.assert_called_once()
+        mock_consumer.close.assert_called_once()
+
+
+@pytest.mark.asyncio
+async def test_subscriber_drain_timeout():
+    """Test Subscriber respects drain timeout."""
+    mock_client = MagicMock()
+    mock_consumer = MagicMock()
+    mock_client.subscribe.return_value = mock_consumer
+    
+    subscriber = Subscriber(
+        client=mock_client,
+        topic="test-topic",
+        subscription="test-subscription", 
+        consumer_name="test-consumer",
+        schema=dict,
+        max_size=10,
+        drain_timeout=0.1  # Very short timeout
+    )
+    
+    # Create subscription with many messages
+    queue = await subscriber.subscribe("test-queue")
+    # Fill queue to max capacity (subscriber max_size=10, but queue itself has maxsize=10)
+    for i in range(5):  # Fill partway to avoid blocking
+        await queue.put({"data": f"msg{i}"})
+    
+    # Test the timeout behavior without actually running start/stop
+    # Just verify the timeout value is set correctly and queue has messages
+    assert subscriber.drain_timeout == 0.1
+    assert not queue.empty()
+    assert queue.qsize() == 5
+    
+    # Simulate what would happen during timeout - queue should still have messages
+    # This tests the concept without the complex async interaction
+    messages_remaining = queue.qsize()
+    assert messages_remaining > 0  # Should have messages that would timeout
+
+
+@pytest.mark.asyncio
+async def test_subscriber_pending_acks_cleanup():
+    """Test Subscriber cleans up pending acknowledgments on shutdown."""
+    mock_client = MagicMock()
+    mock_consumer = MagicMock()
+    mock_client.subscribe.return_value = mock_consumer
+    
+    subscriber = Subscriber(
+        client=mock_client,
+        topic="test-topic",
+        subscription="test-subscription",
+        consumer_name="test-consumer",
+        schema=dict,
+        max_size=10
+    )
+    
+    # Add pending acknowledgments manually (simulating in-flight messages)
+    msg1 = create_mock_message("msg-1")
+    msg2 = create_mock_message("msg-2") 
+    subscriber.pending_acks["ack-1"] = msg1
+    subscriber.pending_acks["ack-2"] = msg2
+    
+    with patch.object(subscriber, 'run') as mock_run:
+        # Mock run that simulates cleanup of pending acks
+        async def mock_run_cleanup():
+            while subscriber.running or subscriber.draining:
+                await asyncio.sleep(0.05)
+                if subscriber.draining:
+                    break
+            
+            # Simulate cleanup in finally block
+            for msg in subscriber.pending_acks.values():
+                mock_consumer.negative_acknowledge(msg)
+            subscriber.pending_acks.clear()
+            
+            mock_consumer.unsubscribe()
+            mock_consumer.close()
+        
+        mock_run.side_effect = mock_run_cleanup
+        
+        await subscriber.start()
+        
+        # Stop subscriber
+        await subscriber.stop()
+        
+        # Should negative acknowledge pending messages
+        assert mock_consumer.negative_acknowledge.call_count == 2
+        mock_consumer.negative_acknowledge.assert_any_call(msg1)
+        mock_consumer.negative_acknowledge.assert_any_call(msg2)
+        
+        # Pending acks should be cleared
+        assert len(subscriber.pending_acks) == 0
+
+
+@pytest.mark.asyncio
+async def test_subscriber_multiple_subscribers():
+    """Test Subscriber with multiple concurrent subscribers."""
+    mock_client = MagicMock()
+    mock_consumer = MagicMock()
+    mock_client.subscribe.return_value = mock_consumer
+    
+    subscriber = Subscriber(
+        client=mock_client,
+        topic="test-topic",
+        subscription="test-subscription",
+        consumer_name="test-consumer",
+        schema=dict,
+        max_size=10
+    )
+    
+    # Manually set consumer to test without complex async interactions
+    subscriber.consumer = mock_consumer
+    
+    # Create multiple subscriptions
+    queue1 = await subscriber.subscribe("queue-1")
+    queue2 = await subscriber.subscribe("queue-2")
+    queue_all = await subscriber.subscribe_all("queue-all")
+    
+    # Process message - use queue-1 as the target
+    msg = create_mock_message("queue-1", {"data": "broadcast"})
+    await subscriber._process_message(msg)
+    
+    # Should acknowledge (successful delivery to all queues)
+    mock_consumer.acknowledge.assert_called_once_with(msg)
+    
+    # Message should be in specific queue (queue-1) and broadcast queue
+    assert not queue1.empty()
+    assert queue2.empty()  # No message for queue-2
+    assert not queue_all.empty()
+    
+    # Verify message content
+    msg1 = await queue1.get()
+    msg_all = await queue_all.get()
+    assert msg1 == {"data": "broadcast"}
+    assert msg_all == {"data": "broadcast"}