diff --git a/rag-engine/src/process/service.py b/rag-engine/src/process/service.py index 3254e22..e784c9a 100644 --- a/rag-engine/src/process/service.py +++ b/rag-engine/src/process/service.py @@ -1,6 +1,6 @@ import logging -from src.layers.chunking.chunk_document import chunk_document -from src.layers.chunking.embedding import embed_chunks +from src.layers.chunking_embedding.chunk_document import chunk_document +from src.layers.chunking_embedding.embedding import embed_chunks from src.layers.data_extractor import extractor from src.layers.structure_analyzer.analyzer import analyze_layout @@ -13,7 +13,9 @@ def processFile(fileType: models.FileType, file_bytes: bytes, metadata: dict): pages, extractor_meta = extractor.pdf(file_bytes) structured_document = analyze_layout(pages) chunks = chunk_document( - structured_document, extractor_meta | metadata, max_tokens=400 + structured_document, + extractor_meta | metadata, + max_tokens=400, ) logging.info(f"pdf data extracted pages: {len(pages)}") chunks = embed_chunks(chunks)