Implement logging strategy (#444)

* Logging strategy and convert all print() calls to logging invocations
This commit is contained in:
cybermaggedon 2025-07-30 23:18:38 +01:00 committed by GitHub
parent 3e0651222b
commit dd70aade11
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
117 changed files with 1216 additions and 667 deletions

View file

@@ -1,5 +1,9 @@
import asyncio
import logging
# Module logger
logger = logging.getLogger(__name__)
LABEL="http://www.w3.org/2000/01/rdf-schema#label"
@@ -18,12 +22,12 @@ class Query:
async def get_vector(self, query):
if self.verbose:
print("Compute embeddings...", flush=True)
logger.debug("Computing embeddings...")
qembeds = await self.rag.embeddings_client.embed(query)
if self.verbose:
print("Done.", flush=True)
logger.debug("Embeddings computed")
return qembeds
@@ -32,7 +36,7 @@ class Query:
vectors = await self.get_vector(query)
if self.verbose:
print("Get docs...", flush=True)
logger.debug("Getting documents...")
docs = await self.rag.doc_embeddings_client.query(
vectors, limit=self.doc_limit,
@@ -40,9 +44,9 @@
)
if self.verbose:
print("Docs:", flush=True)
logger.debug("Documents:")
for doc in docs:
print(doc, flush=True)
logger.debug(f" {doc}")
return docs
@@ -60,7 +64,7 @@ class DocumentRag:
self.doc_embeddings_client = doc_embeddings_client
if self.verbose:
print("Initialised", flush=True)
logger.debug("DocumentRag initialized")
async def query(
self, query, user="trustgraph", collection="default",
@@ -68,7 +72,7 @@
):
if self.verbose:
print("Construct prompt...", flush=True)
logger.debug("Constructing prompt...")
q = Query(
rag=self, user=user, collection=collection, verbose=self.verbose,
@@ -78,9 +82,9 @@
docs = await q.get_docs(query)
if self.verbose:
print("Invoke LLM...", flush=True)
print(docs)
print(query)
logger.debug("Invoking LLM...")
logger.debug(f"Documents: {docs}")
logger.debug(f"Query: {query}")
resp = await self.prompt_client.document_prompt(
query = query,
@@ -88,7 +92,7 @@
)
if self.verbose:
print("Done", flush=True)
logger.debug("Query processing complete")
return resp

View file

@@ -4,12 +4,16 @@ Simple RAG service, performs query using document RAG an LLM.
Input is query, output is response.
"""
import logging
from ... schema import DocumentRagQuery, DocumentRagResponse, Error
from . document_rag import DocumentRag
from ... base import FlowProcessor, ConsumerSpec, ProducerSpec
from ... base import PromptClientSpec, EmbeddingsClientSpec
from ... base import DocumentEmbeddingsClientSpec
# Module logger
logger = logging.getLogger(__name__)
default_ident = "document-rag"
class Processor(FlowProcessor):
@@ -81,7 +85,7 @@ class Processor(FlowProcessor):
# Sender-produced ID
id = msg.properties()["id"]
print(f"Handling input {id}...", flush=True)
logger.info(f"Handling input {id}...")
if v.doc_limit:
doc_limit = v.doc_limit
@@ -98,13 +102,13 @@
properties = {"id": id}
)
print("Done.", flush=True)
logger.info("Request processing complete")
except Exception as e:
print(f"Exception: {e}")
logger.error(f"Document RAG service exception: {e}", exc_info=True)
print("Send error response...", flush=True)
logger.debug("Sending error response...")
await flow("response").send(
DocumentRagResponse(

View file

@@ -1,5 +1,9 @@
import asyncio
import logging
# Module logger
logger = logging.getLogger(__name__)
LABEL="http://www.w3.org/2000/01/rdf-schema#label"
@@ -22,12 +26,12 @@ class Query:
async def get_vector(self, query):
if self.verbose:
print("Compute embeddings...", flush=True)
logger.debug("Computing embeddings...")
qembeds = await self.rag.embeddings_client.embed(query)
if self.verbose:
print("Done.", flush=True)
logger.debug("Done.")
return qembeds
@@ -36,7 +40,7 @@ class Query:
vectors = await self.get_vector(query)
if self.verbose:
print("Get entities...", flush=True)
logger.debug("Getting entities...")
entities = await self.rag.graph_embeddings_client.query(
vectors=vectors, limit=self.entity_limit,
@@ -49,9 +53,9 @@
]
if self.verbose:
print("Entities:", flush=True)
logger.debug("Entities:")
for ent in entities:
print(" ", ent, flush=True)
logger.debug(f" {ent}")
return entities
@@ -126,7 +130,7 @@ class Query:
entities = await self.get_entities(query)
if self.verbose:
print("Get subgraph...", flush=True)
logger.debug("Getting subgraph...")
subgraph = set()
@@ -157,12 +161,12 @@
sg2 = sg2[0:self.max_subgraph_size]
if self.verbose:
print("Subgraph:", flush=True)
logger.debug("Subgraph:")
for edge in sg2:
print(" ", str(edge), flush=True)
logger.debug(f" {str(edge)}")
if self.verbose:
print("Done.", flush=True)
logger.debug("Done.")
return sg2
@@ -183,7 +187,7 @@ class GraphRag:
self.label_cache = {}
if self.verbose:
print("Initialised", flush=True)
logger.debug("GraphRag initialized")
async def query(
self, query, user = "trustgraph", collection = "default",
@@ -192,7 +196,7 @@ class GraphRag:
):
if self.verbose:
print("Construct prompt...", flush=True)
logger.debug("Constructing prompt...")
q = Query(
rag = self, user = user, collection = collection,
@@ -205,14 +209,14 @@
kg = await q.get_labelgraph(query)
if self.verbose:
print("Invoke LLM...", flush=True)
print(kg)
print(query)
logger.debug("Invoking LLM...")
logger.debug(f"Knowledge graph: {kg}")
logger.debug(f"Query: {query}")
resp = await self.prompt_client.kg_prompt(query, kg)
if self.verbose:
print("Done", flush=True)
logger.debug("Query processing complete")
return resp

View file

@@ -4,12 +4,16 @@ Simple RAG service, performs query using graph RAG an LLM.
Input is query, output is response.
"""
import logging
from ... schema import GraphRagQuery, GraphRagResponse, Error
from . graph_rag import GraphRag
from ... base import FlowProcessor, ConsumerSpec, ProducerSpec
from ... base import PromptClientSpec, EmbeddingsClientSpec
from ... base import GraphEmbeddingsClientSpec, TriplesClientSpec
# Module logger
logger = logging.getLogger(__name__)
default_ident = "graph-rag"
default_concurrency = 1
@@ -102,7 +106,7 @@ class Processor(FlowProcessor):
# Sender-produced ID
id = msg.properties()["id"]
print(f"Handling input {id}...", flush=True)
logger.info(f"Handling input {id}...")
if v.entity_limit:
entity_limit = v.entity_limit
@@ -139,13 +143,13 @@
properties = {"id": id}
)
print("Done.", flush=True)
logger.info("Request processing complete")
except Exception as e:
print(f"Exception: {e}")
logger.error(f"Graph RAG service exception: {e}", exc_info=True)
print("Send error response...", flush=True)
logger.debug("Sending error response...")
await flow("response").send(
GraphRagResponse(