From f4733021c500325a15d0fa5ac25ce5b1580128e1 Mon Sep 17 00:00:00 2001
From: cybermaggedon
Date: Mon, 4 Aug 2025 14:01:36 +0100
Subject: [PATCH] Fix Mistral OCR ident to be standard pdf-decoder (#450)

* Fix Mistral OCR ident to be standard pdf-decoder

* Correct test
---
 tests/unit/test_decoding/test_mistral_ocr_processor.py       | 4 ++--
 trustgraph-flow/trustgraph/decoding/mistral_ocr/processor.py | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/tests/unit/test_decoding/test_mistral_ocr_processor.py b/tests/unit/test_decoding/test_mistral_ocr_processor.py
index cb8362b7..4d7b9937 100644
--- a/tests/unit/test_decoding/test_mistral_ocr_processor.py
+++ b/tests/unit/test_decoding/test_mistral_ocr_processor.py
@@ -288,9 +288,9 @@ class TestMistralOcrProcessor(IsolatedAsyncioTestCase):
             run()
 
         # Assert
-        mock_launch.assert_called_once_with("mistral-ocr",
+        mock_launch.assert_called_once_with("pdf-decoder",
                                           "\nSimple decoder, accepts PDF documents on input, outputs pages from the\nPDF document as text as separate output objects.\n")
 
 
 if __name__ == '__main__':
-    pytest.main([__file__])
\ No newline at end of file
+    pytest.main([__file__])
diff --git a/trustgraph-flow/trustgraph/decoding/mistral_ocr/processor.py b/trustgraph-flow/trustgraph/decoding/mistral_ocr/processor.py
index 9532fa0f..3cacb16c 100755
--- a/trustgraph-flow/trustgraph/decoding/mistral_ocr/processor.py
+++ b/trustgraph-flow/trustgraph/decoding/mistral_ocr/processor.py
@@ -21,7 +21,7 @@ import logging
 
 logger = logging.getLogger(__name__)
 
-default_ident = "mistral-ocr"
+default_ident = "pdf-decoder"
 default_api_key = os.getenv("MISTRAL_TOKEN")
 pages_per_chunk = 5
 