diff --git a/ocr.py b/ocr.py index c5b2794..69be57c 100644 --- a/ocr.py +++ b/ocr.py @@ -37,7 +37,7 @@ async def read_images_from_dir(dir_path, lang='eng', write_to_file=False): converted_text[os.path.join(dir_path, file_)] = text if write_to_file: for file_path, text in converted_text.items(): - _write_to_file(text, os.path.splitext(file_path)[0] + ".txt") + _write_to_file(text, f'{os.path.splitext(file_path)[0]}.txt') return converted_text def _write_to_file(text, file_path): diff --git a/server.py b/server.py index dee9adb..c97f104 100644 --- a/server.py +++ b/server.py @@ -33,10 +33,12 @@ async def bulk_extract_text(request: Request, bg_task: BackgroundTasks): @app.get("/api/v1/bulk_output/{task_id}") async def bulk_output(task_id): - text_map = {} - for file_ in os.listdir(task_id): - if file_.endswith("txt"): - text_map[file_] = open(os.path.join(task_id, file_)).read() + text_map = { + file_: open(os.path.join(task_id, file_)).read() + for file_ in os.listdir(task_id) + if file_.endswith("txt") + } + return {"task_id": task_id, "output": text_map} def _save_file_to_disk(uploaded_file, path=".", save_as="default"):