diff --git a/trustgraph-flow/trustgraph/chunking/recursive/chunker.py b/trustgraph-flow/trustgraph/chunking/recursive/chunker.py
index 8604f4fa..bc6d9cb9 100755
--- a/trustgraph-flow/trustgraph/chunking/recursive/chunker.py
+++ b/trustgraph-flow/trustgraph/chunking/recursive/chunker.py
@@ -76,6 +76,12 @@ class Processor(ChunkingService):
             self.default_chunk_overlap
         )
 
+        # Convert to int if they're strings (flow parameters are always strings)
+        if isinstance(chunk_size, str):
+            chunk_size = int(chunk_size)
+        if isinstance(chunk_overlap, str):
+            chunk_overlap = int(chunk_overlap)
+
         # Create text splitter with effective parameters
         text_splitter = RecursiveCharacterTextSplitter(
             chunk_size=chunk_size,
diff --git a/trustgraph-flow/trustgraph/chunking/token/chunker.py b/trustgraph-flow/trustgraph/chunking/token/chunker.py
index b4e55038..876cab07 100755
--- a/trustgraph-flow/trustgraph/chunking/token/chunker.py
+++ b/trustgraph-flow/trustgraph/chunking/token/chunker.py
@@ -75,6 +75,12 @@ class Processor(ChunkingService):
             self.default_chunk_overlap
         )
 
+        # Convert to int if they're strings (flow parameters are always strings)
+        if isinstance(chunk_size, str):
+            chunk_size = int(chunk_size)
+        if isinstance(chunk_overlap, str):
+            chunk_overlap = int(chunk_overlap)
+
         # Create text splitter with effective parameters
         text_splitter = TokenTextSplitter(
             encoding_name="cl100k_base",
diff --git a/trustgraph-flow/trustgraph/query/doc_embeddings/qdrant/service.py b/trustgraph-flow/trustgraph/query/doc_embeddings/qdrant/service.py
index 82134db9..f4e04e98 100755
--- a/trustgraph-flow/trustgraph/query/doc_embeddings/qdrant/service.py
+++ b/trustgraph-flow/trustgraph/query/doc_embeddings/qdrant/service.py
@@ -61,6 +61,10 @@ class Processor(DocumentEmbeddingsQueryService):
         """Check if collection exists (no implicit creation)"""
         return self.qdrant.collection_exists(collection)
 
+    def collection_exists(self, collection):
+        """Check if collection exists (no implicit creation)"""
+        return self.qdrant.collection_exists(collection)
+
     async def query_document_embeddings(self, msg):
 
         try:
diff --git a/trustgraph-flow/trustgraph/query/graph_embeddings/qdrant/service.py b/trustgraph-flow/trustgraph/query/graph_embeddings/qdrant/service.py
index 1cdba33d..6e6be420 100755
--- a/trustgraph-flow/trustgraph/query/graph_embeddings/qdrant/service.py
+++ b/trustgraph-flow/trustgraph/query/graph_embeddings/qdrant/service.py
@@ -61,6 +61,10 @@ class Processor(GraphEmbeddingsQueryService):
         """Check if collection exists (no implicit creation)"""
         return self.qdrant.collection_exists(collection)
 
+    def collection_exists(self, collection):
+        """Check if collection exists (no implicit creation)"""
+        return self.qdrant.collection_exists(collection)
+
     def create_value(self, ent):
         if ent.startswith("http://") or ent.startswith("https://"):
             return Value(value=ent, is_uri=True)
@@ -85,8 +89,6 @@ class Processor(GraphEmbeddingsQueryService):
 
             for vec in msg.vectors:
 
-                self.ensure_collection_exists(collection, dim)
-
                 # Heuristic hack, get (2*limit), so that we have more chance
                 # of getting (limit) entities
                 search_result = self.qdrant.query_points(