mirror of
https://github.com/MODSetter/SurfSense.git
synced 2026-05-21 18:55:16 +02:00
chore: ran linting
This commit is contained in:
parent
30c6f42102
commit
580b75c3c4
3 changed files with 40 additions and 22 deletions
|
|
@ -399,7 +399,9 @@ async def _extract_text_with_etl(
|
||||||
from logging import ERROR, getLogger
|
from logging import ERROR, getLogger
|
||||||
|
|
||||||
etl_service = config.ETL_SERVICE
|
etl_service = config.ETL_SERVICE
|
||||||
logger.debug(f"[_extract_text_with_etl] START - file_path={file_path}, file_name={file_name}, etl_service={etl_service}")
|
logger.debug(
|
||||||
|
f"[_extract_text_with_etl] START - file_path={file_path}, file_name={file_name}, etl_service={etl_service}"
|
||||||
|
)
|
||||||
|
|
||||||
try:
|
try:
|
||||||
if etl_service == "UNSTRUCTURED":
|
if etl_service == "UNSTRUCTURED":
|
||||||
|
|
@ -419,10 +421,14 @@ async def _extract_text_with_etl(
|
||||||
)
|
)
|
||||||
|
|
||||||
docs = await loader.aload()
|
docs = await loader.aload()
|
||||||
logger.debug(f"[_extract_text_with_etl] UNSTRUCTURED loaded {len(docs) if docs else 0} docs")
|
logger.debug(
|
||||||
|
f"[_extract_text_with_etl] UNSTRUCTURED loaded {len(docs) if docs else 0} docs"
|
||||||
|
)
|
||||||
if docs:
|
if docs:
|
||||||
result = await convert_document_to_markdown(docs)
|
result = await convert_document_to_markdown(docs)
|
||||||
logger.debug(f"[_extract_text_with_etl] UNSTRUCTURED result: {len(result) if result else 0} chars")
|
logger.debug(
|
||||||
|
f"[_extract_text_with_etl] UNSTRUCTURED result: {len(result) if result else 0} chars"
|
||||||
|
)
|
||||||
return result
|
return result
|
||||||
logger.debug("[_extract_text_with_etl] UNSTRUCTURED returned no docs")
|
logger.debug("[_extract_text_with_etl] UNSTRUCTURED returned no docs")
|
||||||
return None
|
return None
|
||||||
|
|
@ -447,12 +453,18 @@ async def _extract_text_with_etl(
|
||||||
markdown_documents = await result.aget_markdown_documents(
|
markdown_documents = await result.aget_markdown_documents(
|
||||||
split_by_page=False
|
split_by_page=False
|
||||||
)
|
)
|
||||||
logger.debug(f"[_extract_text_with_etl] LLAMACLOUD got {len(markdown_documents) if markdown_documents else 0} markdown docs")
|
logger.debug(
|
||||||
|
f"[_extract_text_with_etl] LLAMACLOUD got {len(markdown_documents) if markdown_documents else 0} markdown docs"
|
||||||
|
)
|
||||||
if markdown_documents:
|
if markdown_documents:
|
||||||
text = markdown_documents[0].text
|
text = markdown_documents[0].text
|
||||||
logger.debug(f"[_extract_text_with_etl] LLAMACLOUD result: {len(text) if text else 0} chars")
|
logger.debug(
|
||||||
|
f"[_extract_text_with_etl] LLAMACLOUD result: {len(text) if text else 0} chars"
|
||||||
|
)
|
||||||
return text
|
return text
|
||||||
logger.debug("[_extract_text_with_etl] LLAMACLOUD returned no markdown docs")
|
logger.debug(
|
||||||
|
"[_extract_text_with_etl] LLAMACLOUD returned no markdown docs"
|
||||||
|
)
|
||||||
return None
|
return None
|
||||||
|
|
||||||
elif etl_service == "DOCLING":
|
elif etl_service == "DOCLING":
|
||||||
|
|
@ -480,20 +492,29 @@ async def _extract_text_with_etl(
|
||||||
result = await docling_service.process_document(
|
result = await docling_service.process_document(
|
||||||
file_path, file_name
|
file_path, file_name
|
||||||
)
|
)
|
||||||
logger.debug(f"[_extract_text_with_etl] DOCLING result keys: {list(result.keys()) if result else 'None'}")
|
logger.debug(
|
||||||
|
f"[_extract_text_with_etl] DOCLING result keys: {list(result.keys()) if result else 'None'}"
|
||||||
|
)
|
||||||
finally:
|
finally:
|
||||||
pdfminer_logger.setLevel(original_level)
|
pdfminer_logger.setLevel(original_level)
|
||||||
|
|
||||||
content = result.get("content")
|
content = result.get("content")
|
||||||
logger.debug(f"[_extract_text_with_etl] DOCLING content: {len(content) if content else 0} chars")
|
logger.debug(
|
||||||
|
f"[_extract_text_with_etl] DOCLING content: {len(content) if content else 0} chars"
|
||||||
|
)
|
||||||
return content
|
return content
|
||||||
else:
|
else:
|
||||||
logger.warning(f"[_extract_text_with_etl] Unknown ETL service: {etl_service}")
|
logger.warning(
|
||||||
|
f"[_extract_text_with_etl] Unknown ETL service: {etl_service}"
|
||||||
|
)
|
||||||
return None
|
return None
|
||||||
|
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
logger.error(f"[_extract_text_with_etl] ETL extraction EXCEPTION for {file_name}: {e!s}")
|
logger.error(
|
||||||
|
f"[_extract_text_with_etl] ETL extraction EXCEPTION for {file_name}: {e!s}"
|
||||||
|
)
|
||||||
import traceback
|
import traceback
|
||||||
|
|
||||||
logger.error(f"[_extract_text_with_etl] Traceback: {traceback.format_exc()}")
|
logger.error(f"[_extract_text_with_etl] Traceback: {traceback.format_exc()}")
|
||||||
return None
|
return None
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -1357,14 +1357,11 @@ export default function NewChatPage() {
|
||||||
);
|
);
|
||||||
|
|
||||||
// Handle reloading/refreshing the last AI response
|
// Handle reloading/refreshing the last AI response
|
||||||
const onReload = useCallback(
|
const onReload = useCallback(async () => {
|
||||||
async () => {
|
// parentId is the ID of the message to reload from (the user message)
|
||||||
// parentId is the ID of the message to reload from (the user message)
|
// We call regenerate without a query to use the same query
|
||||||
// We call regenerate without a query to use the same query
|
await handleRegenerate(null);
|
||||||
await handleRegenerate(null);
|
}, [handleRegenerate]);
|
||||||
},
|
|
||||||
[handleRegenerate]
|
|
||||||
);
|
|
||||||
|
|
||||||
// Create external store runtime with attachment support
|
// Create external store runtime with attachment support
|
||||||
const runtime = useExternalStoreRuntime({
|
const runtime = useExternalStoreRuntime({
|
||||||
|
|
|
||||||
|
|
@ -428,7 +428,7 @@ export const DocumentMentionPicker = forwardRef<
|
||||||
<Skeleton className="h-4 w-4" />
|
<Skeleton className="h-4 w-4" />
|
||||||
</span>
|
</span>
|
||||||
<span className="flex-1 text-sm">
|
<span className="flex-1 text-sm">
|
||||||
<Skeleton className="h-[20px]" style={{ width: `${60 + (i * 7) % 30}%` }} />
|
<Skeleton className="h-[20px]" style={{ width: `${60 + ((i * 7) % 30)}%` }} />
|
||||||
</span>
|
</span>
|
||||||
</div>
|
</div>
|
||||||
))}
|
))}
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue