Feature/prompts jsonl (#619)

* Tech spec * JSONL implementation complete * Updated prompt client users * Fix tests
2026-06-17 10:55:14 +02:00 · 2026-01-26 17:38:00 +00:00 · 2026-01-26 17:38:00 +00:00 · e214eb4e02
commit e214eb4e02
parent e4f0013841
8 changed files with 1292 additions and 463 deletions
--- a/trustgraph-flow/trustgraph/template/prompt_manager.py
+++ b/trustgraph-flow/trustgraph/template/prompt_manager.py
@ -83,7 +83,7 @@ class PromptManager:

    def parse_json(self, text):
        json_match = re.search(r'```(?:json)?(.*?)```', text, re.DOTALL)
-    
+
        if json_match:
            json_str = json_match.group(1).strip()
        else:
@ -92,6 +92,43 @@ class PromptManager:

        return json.loads(json_str)

+    def parse_jsonl(self, text):
+        """
+        Parse JSONL response, returning list of valid objects.
+
+        Invalid lines (malformed JSON, empty lines) are skipped with warnings.
+        This provides truncation resilience - partial output yields partial results.
+        """
+        results = []
+
+        # Strip markdown code fences if present
+        text = text.strip()
+        if text.startswith('```'):
+            # Remove opening fence (possibly with language hint)
+            text = re.sub(r'^```(?:json|jsonl)?\s*\n?', '', text)
+        if text.endswith('```'):
+            text = text[:-3]
+
+        for line_num, line in enumerate(text.strip().split('\n'), 1):
+            line = line.strip()
+
+            # Skip empty lines
+            if not line:
+                continue
+
+            # Skip any remaining fence markers
+            if line.startswith('```'):
+                continue
+
+            try:
+                obj = json.loads(line)
+                results.append(obj)
+            except json.JSONDecodeError as e:
+                # Log warning but continue - this provides truncation resilience
+                logger.warning(f"JSONL parse error on line {line_num}: {e}")
+
+        return results
+
    def render(self, id, input):

        if id not in self.prompts:
@ -121,21 +158,41 @@ class PromptManager:
        if resp_type == "text":
            return resp

-        if resp_type != "json":
-            raise RuntimeError(f"Response type {resp_type} not known")
-
-        try:
-            obj = self.parse_json(resp)
-        except:
-            logger.error(f"JSON parse failed: {resp}")
-            raise RuntimeError("JSON parse fail")
-
-        if self.prompts[id].schema:
+        if resp_type == "json":
            try:
-                validate(instance=obj, schema=self.prompts[id].schema)
-                logger.debug("Schema validation successful")
-            except Exception as e:
-                raise RuntimeError(f"Schema validation fail: {e}")
+                obj = self.parse_json(resp)
+            except:
+                logger.error(f"JSON parse failed: {resp}")
+                raise RuntimeError("JSON parse fail")

-        return obj
+            if self.prompts[id].schema:
+                try:
+                    validate(instance=obj, schema=self.prompts[id].schema)
+                    logger.debug("Schema validation successful")
+                except Exception as e:
+                    raise RuntimeError(f"Schema validation fail: {e}")
+
+            return obj
+
+        if resp_type == "jsonl":
+            objects = self.parse_jsonl(resp)
+
+            if not objects:
+                logger.warning("JSONL parse returned no valid objects")
+                return []
+
+            # Validate each object against schema if provided
+            if self.prompts[id].schema:
+                validated = []
+                for i, obj in enumerate(objects):
+                    try:
+                        validate(instance=obj, schema=self.prompts[id].schema)
+                        validated.append(obj)
+                    except Exception as e:
+                        logger.warning(f"Object {i} failed schema validation: {e}")
+                return validated
+
+            return objects
+
+        raise RuntimeError(f"Response type {resp_type} not known")