SurfSense/surfsense_backend/app/indexing_pipeline/document_chunker.py

10 lines
348 B
Python
Raw Normal View History

2026-02-25 01:40:30 +02:00
from app.config import config
def chunk_text(text: str, use_code_chunker: bool = False) -> list[str]:
    """Split ``text`` with one of the configured chunkers and return chunk texts.

    Args:
        text: The string passed to the selected chunker's ``chunk`` method.
        use_code_chunker: When truthy, ``config.code_chunker_instance`` is
            used; otherwise ``config.chunker_instance`` is used.

    Returns:
        The ``text`` attribute of every item produced by ``chunk(text)``,
        in iteration order.
    """
    # Only the selected chunker attribute is read from config.
    if use_code_chunker:
        selected = config.code_chunker_instance
    else:
        selected = config.chunker_instance

    return [piece.text for piece in selected.chunk(text)]