Release/v1.2 (#457)

* Bump setup.py versions for 1.1

* PoC MCP server (#419)

* Very initial MCP server PoC for TrustGraph

* Put service on port 8000

* Add MCP container and packages to buildout

* Update docs for API/CLI changes in 1.0 (#421)

* Update some API basics for the 0.23/1.0 API change

* Add MCP container push (#425)

* Add command args to the MCP server (#426)

* Host and port parameters

* Added websocket arg

* More docs

* MCP client support (#427)

- MCP client service
- Tool request/response schema
- API gateway support for mcp-tool
- Message translation for tool request & response
- Make mcp-tool use the configuration service for information
  about where the MCP services are.

* Feature/react call mcp (#428)

Key Features

  - MCP Tool Integration: Added core MCP tool support with ToolClientSpec and ToolClient classes
  - API Enhancement: New mcp_tool method for flow-specific tool invocation
  - CLI Tooling: New tg-invoke-mcp-tool command for testing MCP integration
  - React Agent Enhancement: Fixed and improved multi-tool invocation capabilities
  - Tool Management: Enhanced CLI for tool configuration and management

Changes

  - Added MCP tool invocation to API with flow-specific integration
  - Implemented ToolClientSpec and ToolClient for tool call handling
  - Updated agent-manager-react to invoke MCP tools with configurable types
  - Enhanced CLI with new commands and improved help text
  - Added comprehensive documentation for new CLI commands
  - Improved tool configuration management

Testing

  - Added tg-invoke-mcp-tool CLI command for isolated MCP integration testing
  - Enhanced agent capability to invoke multiple tools simultaneously

* Test suite executed from CI pipeline (#433)

* Test strategy & test cases

* Unit tests

* Integration tests

* Extending test coverage (#434)

* Contract tests

* Testing embeddings

* Agent unit tests

* Knowledge pipeline tests

* Turn on contract tests

* Increase storage test coverage (#435)

* Fixing storage and adding tests

* PR pipeline only runs quick tests

* Empty configuration is returned as empty list, previously was not in response (#436)

* Update config util to take files as well as command-line text (#437)

* Updated CLI invocation and config model for tools and mcp (#438)

* Updated CLI invocation and config model for tools and mcp

* CLI anomalies

* Tweaked the MCP tool implementation for new model

* Update agent implementation to match the new model

* Fix agent tools, now all tested

* Fixed integration tests

* Fix MCP delete tool params

* Update Python deps to 1.2

* Update to enable knowledge extraction using the agent framework (#439)

* Implement KG extraction agent (kg-extract-agent)

* Using ReAct framework (agent-manager-react)
 
* ReAct manager had an issue when emitting JSON, which conflicted with the ReAct manager's own JSON messages, so refactored the ReAct manager to use traditional, non-JSON ReAct messages.
 
* Minor refactor to take the prompt template client out of prompt-template so it can be more readily used by other modules. kg-extract-agent uses this framework.

* Migrate from setup.py to pyproject.toml (#440)

* Converted setup.py to pyproject.toml

* Modern package infrastructure as recommended by py docs

* Install missing build deps (#441)

* Install missing build deps (#442)

* Implement logging strategy (#444)

* Logging strategy and convert all prints() to logging invocations

* Fix/startup failure (#445)

* Fix logging startup problems

* Fix logging startup problems (#446)

* Fix logging startup problems (#447)

* Fixed Mistral OCR to use current API (#448)

* Fixed Mistral OCR to use current API

* Added PDF decoder tests

* Fix Mistral OCR ident to be standard pdf-decoder (#450)

* Fix Mistral OCR ident to be standard pdf-decoder

* Correct test

* Schema structure refactor (#451)

* Write schema refactor spec

* Implemented schema refactor spec

* Structure data mvp (#452)

* Structured data tech spec

* Architecture principles

* New schemas

* Updated schemas and specs

* Object extractor

* Add .coveragerc

* New tests

* Cassandra object storage

* Trying to get object extraction working, issues exist

* Validate librarian collection (#453)

* Fix token chunker, broken API invocation (#454)

* Fix token chunker, broken API invocation (#455)

* Knowledge load utility CLI (#456)

* Knowledge loader

* More tests
This commit is contained in:
cybermaggedon 2025-08-18 20:56:09 +01:00 committed by GitHub
parent c85ba197be
commit 89be656990
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
509 changed files with 49632 additions and 5159 deletions

View file

@ -28,4 +28,7 @@ from . triples_client import TriplesClientSpec
from . document_embeddings_client import DocumentEmbeddingsClientSpec
from . agent_service import AgentService
from . graph_rag_client import GraphRagClientSpec
from . tool_service import ToolService
from . tool_client import ToolClientSpec
from . agent_client import AgentClientSpec

View file

@ -4,9 +4,9 @@ from .. schema import AgentRequest, AgentResponse
from .. knowledge import Uri, Literal
class AgentClient(RequestResponse):
async def request(self, recipient, question, plan=None, state=None,
async def invoke(self, recipient, question, plan=None, state=None,
history=[], timeout=300):
resp = await self.request(
AgentRequest(
question = question,
@ -18,22 +18,20 @@ class AgentClient(RequestResponse):
timeout=timeout,
)
print(resp, flush=True)
if resp.error:
raise RuntimeError(resp.error.message)
return resp
return resp.answer
class GraphEmbeddingsClientSpec(RequestResponseSpec):
class AgentClientSpec(RequestResponseSpec):
def __init__(
self, request_name, response_name,
):
super(GraphEmbeddingsClientSpec, self).__init__(
super(AgentClientSpec, self).__init__(
request_name = request_name,
request_schema = GraphEmbeddingsRequest,
request_schema = AgentRequest,
response_name = response_name,
response_schema = GraphEmbeddingsResponse,
impl = GraphEmbeddingsClient,
response_schema = AgentResponse,
impl = AgentClient,
)

View file

@ -4,12 +4,16 @@ Agent manager service completion base class
"""
import time
import logging
from prometheus_client import Histogram
from .. schema import AgentRequest, AgentResponse, Error
from .. exceptions import TooManyRequests
from .. base import FlowProcessor, ConsumerSpec, ProducerSpec
# Module logger
logger = logging.getLogger(__name__)
default_ident = "agent-manager"
class AgentService(FlowProcessor):
@ -76,9 +80,9 @@ class AgentService(FlowProcessor):
except Exception as e:
# Apart from rate limits, treat all exceptions as unrecoverable
print(f"on_request Exception: {e}")
logger.error(f"Exception in agent service on_request: {e}", exc_info=True)
print("Send error response...", flush=True)
logger.info("Sending error response...")
await flow.producer["response"].send(
AgentResponse(

View file

@ -9,6 +9,8 @@ import argparse
import _pulsar
import time
import uuid
import logging
import os
from prometheus_client import start_http_server, Info
from .. schema import ConfigPush, config_push_queue
@ -20,6 +22,9 @@ from . metrics import ProcessorMetrics, ConsumerMetrics
default_config_queue = config_push_queue
# Module logger
logger = logging.getLogger(__name__)
# Async processor
class AsyncProcessor:
@ -113,7 +118,7 @@ class AsyncProcessor:
version = message.value().version
# Invoke message handlers
print("Config change event", version, flush=True)
logger.info(f"Config change event: version={version}")
for ch in self.config_handlers:
await ch(config, version)
@ -156,9 +161,23 @@ class AsyncProcessor:
# This is here to output a debug message, shouldn't be needed.
except Exception as e:
print("Exception, closing taskgroup", flush=True)
logger.error("Exception, closing taskgroup", exc_info=True)
raise e
@classmethod
def setup_logging(cls, log_level='INFO'):
"""Configure logging for the entire application"""
# Support environment variable override
env_log_level = os.environ.get('TRUSTGRAPH_LOG_LEVEL', log_level)
# Configure logging
logging.basicConfig(
level=getattr(logging, env_log_level.upper()),
format='%(asctime)s - %(name)s - %(levelname)s - %(message)s',
handlers=[logging.StreamHandler()]
)
logger.info(f"Logging configured with level: {env_log_level}")
# Startup fabric. launch calls launch_async in async mode.
@classmethod
def launch(cls, ident, doc):
@ -183,8 +202,11 @@ class AsyncProcessor:
args = parser.parse_args()
args = vars(args)
# Setup logging before anything else
cls.setup_logging(args.get('log_level', 'INFO').upper())
# Debug
print(args, flush=True)
logger.debug(f"Arguments: {args}")
# Start the Prometheus metrics service if needed
if args["metrics"]:
@ -193,7 +215,7 @@ class AsyncProcessor:
# Loop forever, exception handler
while True:
print("Starting...", flush=True)
logger.info("Starting...")
try:
@ -203,30 +225,30 @@ class AsyncProcessor:
))
except KeyboardInterrupt:
print("Keyboard interrupt.", flush=True)
logger.info("Keyboard interrupt.")
return
except _pulsar.Interrupted:
print("Pulsar Interrupted.", flush=True)
logger.info("Pulsar Interrupted.")
return
# Exceptions from a taskgroup come in as an exception group
except ExceptionGroup as e:
print("Exception group:", flush=True)
logger.error("Exception group:")
for se in e.exceptions:
print(" Type:", type(se), flush=True)
print(f" Exception: {se}", flush=True)
logger.error(f" Type: {type(se)}")
logger.error(f" Exception: {se}", exc_info=se)
except Exception as e:
print("Type:", type(e), flush=True)
print("Exception:", e, flush=True)
logger.error(f"Type: {type(e)}")
logger.error(f"Exception: {e}", exc_info=True)
# Retry occurs here
print("Will retry...", flush=True)
logger.warning("Will retry...")
time.sleep(4)
print("Retrying...", flush=True)
logger.info("Retrying...")
# The command-line arguments are built using a stack of add_args
# invocations
@ -254,3 +276,4 @@ class AsyncProcessor:
default=8000,
help=f'Pulsar host (default: 8000)',
)

View file

@ -14,9 +14,13 @@ import pulsar
import _pulsar
import asyncio
import time
import logging
from .. exceptions import TooManyRequests
# Module logger
logger = logging.getLogger(__name__)
class Consumer:
def __init__(
@ -90,7 +94,7 @@ class Consumer:
try:
print(self.topic, "subscribing...", flush=True)
logger.info(f"Subscribing to topic: {self.topic}")
if self.start_of_messages:
pos = pulsar.InitialPosition.Earliest
@ -108,21 +112,18 @@ class Consumer:
except Exception as e:
print("consumer subs Exception:", e, flush=True)
logger.error(f"Consumer subscription exception: {e}", exc_info=True)
await asyncio.sleep(self.reconnect_time)
continue
print(self.topic, "subscribed", flush=True)
logger.info(f"Successfully subscribed to topic: {self.topic}")
if self.metrics:
self.metrics.state("running")
try:
print(
"Starting", self.concurrency, "receiver threads",
flush=True
)
logger.info(f"Starting {self.concurrency} receiver threads")
async with asyncio.TaskGroup() as tg:
@ -138,7 +139,7 @@ class Consumer:
except Exception as e:
print("consumer loop exception:", e, flush=True)
logger.error(f"Consumer loop exception: {e}", exc_info=True)
self.consumer.unsubscribe()
self.consumer.close()
self.consumer = None
@ -174,7 +175,7 @@ class Consumer:
if time.time() > expiry:
print("Gave up waiting for rate-limit retry", flush=True)
logger.warning("Gave up waiting for rate-limit retry")
# Message failed to be processed, this causes it to
# be retried
@ -188,7 +189,7 @@ class Consumer:
try:
print("Handle...", flush=True)
logger.debug("Processing message...")
if self.metrics:
@ -198,7 +199,7 @@ class Consumer:
else:
await self.handler(msg, self, self.flow)
print("Handled.", flush=True)
logger.debug("Message processed successfully")
# Acknowledge successful processing of the message
self.consumer.acknowledge(msg)
@ -211,7 +212,7 @@ class Consumer:
except TooManyRequests:
print("TooManyRequests: will retry...", flush=True)
logger.warning("Rate limit exceeded, will retry...")
if self.metrics:
self.metrics.rate_limit()
@ -224,7 +225,7 @@ class Consumer:
except Exception as e:
print("consume exception:", e, flush=True)
logger.error(f"Message processing exception: {e}", exc_info=True)
# Message failed to be processed, this causes it to
# be retried

View file

@ -1,8 +1,13 @@
import logging
from . request_response_spec import RequestResponse, RequestResponseSpec
from .. schema import DocumentEmbeddingsRequest, DocumentEmbeddingsResponse
from .. knowledge import Uri, Literal
# Module logger
logger = logging.getLogger(__name__)
class DocumentEmbeddingsClient(RequestResponse):
async def query(self, vectors, limit=20, user="trustgraph",
collection="default", timeout=30):
@ -17,7 +22,7 @@ class DocumentEmbeddingsClient(RequestResponse):
timeout=timeout
)
print(resp, flush=True)
logger.debug(f"Document embeddings response: {resp}")
if resp.error:
raise RuntimeError(resp.error.message)

View file

@ -4,6 +4,8 @@ Document embeddings query service. Input is vectors. Output is list of
embeddings.
"""
import logging
from .. schema import DocumentEmbeddingsRequest, DocumentEmbeddingsResponse
from .. schema import Error, Value
@ -11,6 +13,9 @@ from . flow_processor import FlowProcessor
from . consumer_spec import ConsumerSpec
from . producer_spec import ProducerSpec
# Module logger
logger = logging.getLogger(__name__)
default_ident = "ge-query"
class DocumentEmbeddingsQueryService(FlowProcessor):
@ -47,21 +52,21 @@ class DocumentEmbeddingsQueryService(FlowProcessor):
# Sender-produced ID
id = msg.properties()["id"]
print(f"Handling input {id}...", flush=True)
logger.debug(f"Handling document embeddings query request {id}...")
docs = await self.query_document_embeddings(request)
print("Send response...", flush=True)
logger.debug("Sending document embeddings query response...")
r = DocumentEmbeddingsResponse(documents=docs, error=None)
await flow("response").send(r, properties={"id": id})
print("Done.", flush=True)
logger.debug("Document embeddings query request completed")
except Exception as e:
print(f"Exception: {e}")
logger.error(f"Exception in document embeddings query service: {e}", exc_info=True)
print("Send error response...", flush=True)
logger.info("Sending error response...")
r = DocumentEmbeddingsResponse(
error=Error(

View file

@ -3,10 +3,15 @@
Document embeddings store base class
"""
import logging
from .. schema import DocumentEmbeddings
from .. base import FlowProcessor, ConsumerSpec
from .. exceptions import TooManyRequests
# Module logger
logger = logging.getLogger(__name__)
default_ident = "document-embeddings-write"
class DocumentEmbeddingsStoreService(FlowProcessor):
@ -40,7 +45,7 @@ class DocumentEmbeddingsStoreService(FlowProcessor):
except Exception as e:
print(f"Exception: {e}")
logger.error(f"Exception in document embeddings store service: {e}", exc_info=True)
raise e
@staticmethod

View file

@ -4,12 +4,16 @@ Embeddings resolution base class
"""
import time
import logging
from prometheus_client import Histogram
from .. schema import EmbeddingsRequest, EmbeddingsResponse, Error
from .. exceptions import TooManyRequests
from .. base import FlowProcessor, ConsumerSpec, ProducerSpec
# Module logger
logger = logging.getLogger(__name__)
default_ident = "embeddings"
default_concurrency = 1
@ -51,7 +55,7 @@ class EmbeddingsService(FlowProcessor):
id = msg.properties()["id"]
print("Handling request", id, "...", flush=True)
logger.debug(f"Handling embeddings request {id}...")
vectors = await self.on_embeddings(request.text)
@ -63,7 +67,7 @@ class EmbeddingsService(FlowProcessor):
properties={"id": id}
)
print("Handled.", flush=True)
logger.debug("Embeddings request handled successfully")
except TooManyRequests as e:
raise e
@ -72,9 +76,9 @@ class EmbeddingsService(FlowProcessor):
# Apart from rate limits, treat all exceptions as unrecoverable
print(f"Exception: {e}", flush=True)
logger.error(f"Exception in embeddings service: {e}", exc_info=True)
print("Send error response...", flush=True)
logger.info("Sending error response...")
await flow.producer["response"].send(
EmbeddingsResponse(

View file

@ -4,6 +4,7 @@
# configuration service which can't manage itself.
import json
import logging
from pulsar.schema import JsonSchema
@ -14,6 +15,9 @@ from .. log_level import LogLevel
from . async_processor import AsyncProcessor
from . flow import Flow
# Module logger
logger = logging.getLogger(__name__)
# Parent class for configurable processors, configured with flows by
# the config service
class FlowProcessor(AsyncProcessor):
@ -34,7 +38,7 @@ class FlowProcessor(AsyncProcessor):
# Array of specifications: ConsumerSpec, ProducerSpec, SettingSpec
self.specifications = []
print("Service initialised.")
logger.info("Service initialised.")
# Register a configuration variable
def register_specification(self, spec):
@ -44,19 +48,19 @@ class FlowProcessor(AsyncProcessor):
async def start_flow(self, flow, defn):
self.flows[flow] = Flow(self.id, flow, self, defn)
await self.flows[flow].start()
print("Started flow: ", flow)
logger.info(f"Started flow: {flow}")
# Stop processing for a new flow
async def stop_flow(self, flow):
if flow in self.flows:
await self.flows[flow].stop()
del self.flows[flow]
print("Stopped flow: ", flow, flush=True)
logger.info(f"Stopped flow: {flow}")
# Event handler - called for a configuration change
async def on_configure_flows(self, config, version):
print("Got config version", version, flush=True)
logger.info(f"Got config version {version}")
# Skip over invalid data
if "flows-active" not in config: return
@ -69,7 +73,7 @@ class FlowProcessor(AsyncProcessor):
else:
print("No configuration settings for me.", flush=True)
logger.debug("No configuration settings for me.")
flow_config = {}
# Get list of flows which should be running and are currently
@ -88,7 +92,7 @@ class FlowProcessor(AsyncProcessor):
if flow not in wanted_flows:
await self.stop_flow(flow)
print("Handled config update")
logger.info("Handled config update")
# Start threads, just call parent
async def start(self):

View file

@ -1,8 +1,13 @@
import logging
from . request_response_spec import RequestResponse, RequestResponseSpec
from .. schema import GraphEmbeddingsRequest, GraphEmbeddingsResponse
from .. knowledge import Uri, Literal
# Module logger
logger = logging.getLogger(__name__)
def to_value(x):
if x.is_uri: return Uri(x.value)
return Literal(x.value)
@ -21,7 +26,7 @@ class GraphEmbeddingsClient(RequestResponse):
timeout=timeout
)
print(resp, flush=True)
logger.debug(f"Graph embeddings response: {resp}")
if resp.error:
raise RuntimeError(resp.error.message)

View file

@ -4,6 +4,8 @@ Graph embeddings query service. Input is vectors. Output is list of
embeddings.
"""
import logging
from .. schema import GraphEmbeddingsRequest, GraphEmbeddingsResponse
from .. schema import Error, Value
@ -11,6 +13,9 @@ from . flow_processor import FlowProcessor
from . consumer_spec import ConsumerSpec
from . producer_spec import ProducerSpec
# Module logger
logger = logging.getLogger(__name__)
default_ident = "ge-query"
class GraphEmbeddingsQueryService(FlowProcessor):
@ -47,21 +52,21 @@ class GraphEmbeddingsQueryService(FlowProcessor):
# Sender-produced ID
id = msg.properties()["id"]
print(f"Handling input {id}...", flush=True)
logger.debug(f"Handling graph embeddings query request {id}...")
entities = await self.query_graph_embeddings(request)
print("Send response...", flush=True)
logger.debug("Sending graph embeddings query response...")
r = GraphEmbeddingsResponse(entities=entities, error=None)
await flow("response").send(r, properties={"id": id})
print("Done.", flush=True)
logger.debug("Graph embeddings query request completed")
except Exception as e:
print(f"Exception: {e}")
logger.error(f"Exception in graph embeddings query service: {e}", exc_info=True)
print("Send error response...", flush=True)
logger.info("Sending error response...")
r = GraphEmbeddingsResponse(
error=Error(

View file

@ -3,10 +3,15 @@
Graph embeddings store base class
"""
import logging
from .. schema import GraphEmbeddings
from .. base import FlowProcessor, ConsumerSpec
from .. exceptions import TooManyRequests
# Module logger
logger = logging.getLogger(__name__)
default_ident = "graph-embeddings-write"
class GraphEmbeddingsStoreService(FlowProcessor):
@ -40,7 +45,7 @@ class GraphEmbeddingsStoreService(FlowProcessor):
except Exception as e:
print(f"Exception: {e}")
logger.error(f"Exception in graph embeddings store service: {e}", exc_info=True)
raise e
@staticmethod

View file

@ -4,12 +4,16 @@ LLM text completion base class
"""
import time
import logging
from prometheus_client import Histogram
from .. schema import TextCompletionRequest, TextCompletionResponse, Error
from .. exceptions import TooManyRequests
from .. base import FlowProcessor, ConsumerSpec, ProducerSpec
# Module logger
logger = logging.getLogger(__name__)
default_ident = "text-completion"
default_concurrency = 1
@ -103,9 +107,9 @@ class LlmService(FlowProcessor):
# Apart from rate limits, treat all exceptions as unrecoverable
print(f"Exception: {e}")
logger.error(f"LLM service exception: {e}", exc_info=True)
print("Send error response...", flush=True)
logger.debug("Sending error response...")
await flow.producer["response"].send(
TextCompletionResponse(

View file

@ -1,6 +1,10 @@
from pulsar.schema import JsonSchema
import asyncio
import logging
# Module logger
logger = logging.getLogger(__name__)
class Producer:
@ -39,15 +43,15 @@ class Producer:
while self.running and self.producer is None:
try:
print("Connect publisher to", self.topic, "...", flush=True)
logger.info(f"Connecting publisher to {self.topic}...")
self.producer = self.client.create_producer(
topic = self.topic,
schema = JsonSchema(self.schema),
chunking_enabled = self.chunking_enabled,
)
print("Connected to", self.topic, flush=True)
logger.info(f"Connected publisher to {self.topic}")
except Exception as e:
print("Exception:", e, flush=True)
logger.error(f"Exception connecting publisher: {e}", exc_info=True)
await asyncio.sleep(2)
if not self.running: break
@ -68,7 +72,7 @@ class Producer:
break
except Exception as e:
print("Exception:", e, flush=True)
logger.error(f"Exception sending message: {e}", exc_info=True)
self.producer.close()
self.producer = None

View file

@ -40,6 +40,13 @@ class PromptClient(RequestResponse):
timeout = timeout,
)
async def extract_objects(self, text, schema, timeout=600):
return await self.prompt(
id = "extract-rows",
variables = { "text": text, "schema": schema, },
timeout = timeout,
)
async def kg_prompt(self, query, kg, timeout=600):
return await self.prompt(
id = "kg-prompt",

View file

@ -4,6 +4,10 @@ from pulsar.schema import JsonSchema
import asyncio
import time
import pulsar
import logging
# Module logger
logger = logging.getLogger(__name__)
class Publisher:
@ -62,7 +66,7 @@ class Publisher:
producer.send(item)
except Exception as e:
print("Exception:", e, flush=True)
logger.error(f"Exception in publisher: {e}", exc_info=True)
if not self.running:
return

View file

@ -1,6 +1,7 @@
import os
import pulsar
import _pulsar
import uuid
from pulsar.schema import JsonSchema
@ -21,7 +22,7 @@ class PulsarClient:
"pulsar_api_key",
self.default_pulsar_api_key
)
log_level = params.get("log_level", LogLevel.INFO)
# Hard-code Pulsar logging to ERROR level to minimize noise
self.pulsar_host = pulsar_host
self.pulsar_api_key = pulsar_api_key
@ -31,13 +32,13 @@ class PulsarClient:
self.client = pulsar.Client(
pulsar_host,
authentication=auth,
logger=pulsar.ConsoleLogger(log_level.to_pulsar())
logger=pulsar.ConsoleLogger(_pulsar.LoggerLevel.Error)
)
else:
self.client = pulsar.Client(
pulsar_host,
listener_name=pulsar_listener,
logger=pulsar.ConsoleLogger(log_level.to_pulsar())
logger=pulsar.ConsoleLogger(_pulsar.LoggerLevel.Error)
)
self.pulsar_listener = pulsar_listener
@ -73,8 +74,7 @@ class PulsarClient:
parser.add_argument(
'-l', '--log-level',
type=LogLevel,
default=LogLevel.INFO,
choices=list(LogLevel),
help=f'Output queue (default: info)'
default='INFO',
choices=['DEBUG', 'INFO', 'WARNING', 'ERROR', 'CRITICAL'],
help=f'Log level (default: INFO)'
)

View file

@ -1,12 +1,16 @@
import uuid
import asyncio
import logging
from . subscriber import Subscriber
from . producer import Producer
from . spec import Spec
from . metrics import ConsumerMetrics, ProducerMetrics, SubscriberMetrics
# Module logger
logger = logging.getLogger(__name__)
class RequestResponse(Subscriber):
def __init__(
@ -45,7 +49,7 @@ class RequestResponse(Subscriber):
id = str(uuid.uuid4())
print("Request", id, "...", flush=True)
logger.debug(f"Sending request {id}...")
q = await self.subscribe(id)
@ -58,7 +62,7 @@ class RequestResponse(Subscriber):
except Exception as e:
print("Exception:", e)
logger.error(f"Exception sending request: {e}", exc_info=True)
raise e
@ -71,7 +75,7 @@ class RequestResponse(Subscriber):
timeout=timeout
)
print("Got response.", flush=True)
logger.debug("Received response")
if recipient is None:
@ -93,7 +97,7 @@ class RequestResponse(Subscriber):
except Exception as e:
print("Exception:", e)
logger.error(f"Exception processing response: {e}", exc_info=True)
raise e
finally:

View file

@ -7,6 +7,10 @@ from pulsar.schema import JsonSchema
import asyncio
import _pulsar
import time
import logging
# Module logger
logger = logging.getLogger(__name__)
class Subscriber:
@ -66,7 +70,7 @@ class Subscriber:
if self.metrics:
self.metrics.state("running")
print("Subscriber running...", flush=True)
logger.info("Subscriber running...")
while self.running:
@ -78,8 +82,7 @@ class Subscriber:
except _pulsar.Timeout:
continue
except Exception as e:
print("Exception:", e, flush=True)
print(type(e))
logger.error(f"Exception in subscriber receive: {e}", exc_info=True)
raise e
if self.metrics:
@ -110,7 +113,7 @@ class Subscriber:
except Exception as e:
self.metrics.dropped()
print("Q Put:", e, flush=True)
logger.warning(f"Failed to put message in queue: {e}")
for q in self.full.values():
try:
@ -121,10 +124,10 @@ class Subscriber:
)
except Exception as e:
self.metrics.dropped()
print("Q Put:", e, flush=True)
logger.warning(f"Failed to put message in full queue: {e}")
except Exception as e:
print("Subscriber exception:", e, flush=True)
logger.error(f"Subscriber exception: {e}", exc_info=True)
finally:

View file

@ -0,0 +1,40 @@
import json
from . request_response_spec import RequestResponse, RequestResponseSpec
from .. schema import ToolRequest, ToolResponse
class ToolClient(RequestResponse):
    """Request/response client for invoking a named tool over the fabric."""

    async def invoke(self, name, parameters=None, timeout=600):
        """Invoke the named tool and return its result.

        :param name: tool identifier
        :param parameters: dict of tool parameters, JSON-serialised into
            the request; None is treated as an empty parameter set
        :param timeout: request timeout in seconds
        :returns: the tool's text output when present, otherwise the
            JSON-decoded object output
        :raises RuntimeError: if the tool service returns an error
        """

        # Use None as the default rather than {}: a mutable default
        # argument is shared across calls and is a well-known pitfall.
        if parameters is None:
            parameters = {}

        resp = await self.request(
            ToolRequest(
                name = name,
                parameters = json.dumps(parameters),
            ),
            timeout=timeout
        )

        if resp.error:
            raise RuntimeError(resp.error.message)

        # Text responses take precedence; otherwise decode the JSON object
        if resp.text: return resp.text

        return json.loads(resp.object)
class ToolClientSpec(RequestResponseSpec):
    """Specification binding the ToolRequest/ToolResponse schemas to the
    ToolClient implementation."""

    def __init__(
            self, request_name, response_name,
    ):
        # Zero-argument super() — equivalent to the explicit two-argument
        # form in Python 3.
        super().__init__(
            request_name = request_name,
            request_schema = ToolRequest,
            response_name = response_name,
            response_schema = ToolResponse,
            impl = ToolClient,
        )

View file

@ -0,0 +1,125 @@
"""
Tool invocation base class
"""
import json
import logging
from prometheus_client import Counter
from .. schema import ToolRequest, ToolResponse, Error
from .. exceptions import TooManyRequests
from .. base import FlowProcessor, ConsumerSpec, ProducerSpec
# Module logger
logger = logging.getLogger(__name__)
default_concurrency = 1
class ToolService(FlowProcessor):
    """
    Tool invocation base class.  Consumes ToolRequest messages, delegates
    to invoke_tool() (implemented by subclasses) and produces ToolResponse
    messages carrying either a text result or a JSON-encoded object.
    """

    def __init__(self, **params):

        id = params.get("id")
        concurrency = params.get("concurrency", 1)

        super(ToolService, self).__init__(**params | {
            "id": id,
            "concurrency": concurrency,
        })

        # Incoming tool invocation requests
        self.register_specification(
            ConsumerSpec(
                name = "request",
                schema = ToolRequest,
                handler = self.on_request,
                concurrency = concurrency,
            )
        )

        # Outgoing tool invocation responses
        self.register_specification(
            ProducerSpec(
                name = "response",
                schema = ToolResponse
            )
        )

        # Class-level metric, created once regardless of instance count
        if not hasattr(__class__, "tool_invocation_metric"):
            __class__.tool_invocation_metric = Counter(
                'tool_invocation_count', 'Tool invocation count',
                ["id", "flow", "name"],
            )

    async def on_request(self, msg, consumer, flow):
        """Handle one ToolRequest message; always sends a response,
        either a result or an error."""

        # Sender-produced ID.  Read it before the try block: the error
        # handler needs it, and with the assignment inside the try a
        # failure before it would make the handler silently pick up the
        # id() builtin instead of the correlation ID.
        id = msg.properties()["id"]

        try:

            request = msg.value()

            response = await self.invoke_tool(
                request.name,
                json.loads(request.parameters) if request.parameters else {},
            )

            # String results travel in the text field; any other result
            # is JSON-serialised into the object field.
            if isinstance(response, str):
                await flow("response").send(
                    ToolResponse(
                        error=None,
                        text=response,
                        object=None,
                    ),
                    properties={"id": id}
                )
            else:
                await flow("response").send(
                    ToolResponse(
                        error=None,
                        text=None,
                        object=json.dumps(response),
                    ),
                    properties={"id": id}
                )

            __class__.tool_invocation_metric.labels(
                id = self.id, flow = flow.name, name = request.name,
            ).inc()

        except TooManyRequests as e:
            # Rate limiting is recoverable: propagate so the message is
            # retried by the consumer.
            raise e

        except Exception as e:

            # Apart from rate limits, treat all exceptions as unrecoverable
            logger.error(f"Exception in tool service: {e}", exc_info=True)
            logger.info("Sending error response...")

            await flow.producer["response"].send(
                ToolResponse(
                    error=Error(
                        type = "tool-error",
                        message = str(e),
                    ),
                    text=None,
                    object=None,
                ),
                properties={"id": id}
            )

    @staticmethod
    def add_args(parser):
        """Add tool-service command-line arguments to the parser."""

        parser.add_argument(
            '-c', '--concurrency',
            type=int,
            default=default_concurrency,
            help=f'Concurrent processing threads (default: {default_concurrency})'
        )

        FlowProcessor.add_args(parser)

View file

@ -4,6 +4,8 @@ Triples query service. Input is a (s, p, o) triple, some values may be
null. Output is a list of triples.
"""
import logging
from .. schema import TriplesQueryRequest, TriplesQueryResponse, Error
from .. schema import Value, Triple
@ -11,6 +13,9 @@ from . flow_processor import FlowProcessor
from . consumer_spec import ConsumerSpec
from . producer_spec import ProducerSpec
# Module logger
logger = logging.getLogger(__name__)
default_ident = "triples-query"
class TriplesQueryService(FlowProcessor):
@ -45,21 +50,21 @@ class TriplesQueryService(FlowProcessor):
# Sender-produced ID
id = msg.properties()["id"]
print(f"Handling input {id}...", flush=True)
logger.debug(f"Handling triples query request {id}...")
triples = await self.query_triples(request)
print("Send response...", flush=True)
logger.debug("Sending triples query response...")
r = TriplesQueryResponse(triples=triples, error=None)
await flow("response").send(r, properties={"id": id})
print("Done.", flush=True)
logger.debug("Triples query request completed")
except Exception as e:
print(f"Exception: {e}")
logger.error(f"Exception in triples query service: {e}", exc_info=True)
print("Send error response...", flush=True)
logger.info("Sending error response...")
r = TriplesQueryResponse(
error = Error(

View file

@ -3,10 +3,15 @@
Triples store base class
"""
import logging
from .. schema import Triples
from .. base import FlowProcessor, ConsumerSpec
from .. exceptions import TooManyRequests
# Module logger
logger = logging.getLogger(__name__)
default_ident = "triples-write"
class TriplesStoreService(FlowProcessor):
@ -38,7 +43,7 @@ class TriplesStoreService(FlowProcessor):
except Exception as e:
print(f"Exception: {e}")
logger.error(f"Exception in triples store service: {e}", exc_info=True)
raise e
@staticmethod