SurfSense/surfsense_backend/app/indexing_pipeline/document_chunker.py

8 lines
332 B
Python
Raw Normal View History

2026-02-25 01:40:30 +02:00
from app.config import config
def chunk_text(text: str, use_code_chunker: bool = False) -> list[str]:
    """Split ``text`` into chunks and return the text of each chunk.

    Args:
        text: The string to be chunked.
        use_code_chunker: When true, ``config.code_chunker_instance`` does
            the chunking; otherwise ``config.chunker_instance`` is used.

    Returns:
        The ``text`` attribute of every chunk yielded by the selected
        chunker's ``chunk`` method, in the order they were produced.
    """
    # Only the chunker that is actually selected is looked up on ``config``.
    if use_code_chunker:
        selected = config.code_chunker_instance
    else:
        selected = config.chunker_instance

    pieces = selected.chunk(text)
    return [piece.text for piece in pieces]