Flow temperature parameter (#533)

* Add temperature parameter to LlmService and roll out to all LLMs
This commit is contained in:
cybermaggedon 2025-09-25 21:26:11 +01:00 committed by GitHub
parent aa8e422e8c
commit 6f4f7ce6b4
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
15 changed files with 164 additions and 72 deletions

View file

@@ -5,7 +5,7 @@ LLM text completion base class
import time
import logging
from prometheus_client import Histogram
from prometheus_client import Histogram, Info
from .. schema import TextCompletionRequest, TextCompletionResponse, Error
from .. exceptions import TooManyRequests
@@ -62,6 +62,12 @@ class LlmService(FlowProcessor):
)
)
self.register_specification(
ParameterSpec(
name = "temperature",
)
)
if not hasattr(__class__, "text_completion_metric"):
__class__.text_completion_metric = Histogram(
'text_completion_duration',
@@ -76,6 +82,13 @@ class LlmService(FlowProcessor):
]
)
if not hasattr(__class__, "text_completion_model_metric"):
__class__.text_completion_model_metric = Info(
'text_completion_model',
'Text completion model',
["processor", "flow"]
)
async def on_request(self, msg, consumer, flow):
try:
@@ -92,11 +105,19 @@
).time():
model = flow("model")
temperature = flow("temperature")
response = await self.generate_content(
request.system, request.prompt, model
request.system, request.prompt, model, temperature
)
await __class__.text_completion_model_metric.labels(
id = flow.id, flow = flow.name
).info({
"model": model,
"temperature": temperature,
})
await flow("response").send(
TextCompletionResponse(
error=None,