diff --git a/backend/app/utils/docx_parser.py b/backend/app/utils/docx_parser.py index 9e06804..7205cda 100644 --- a/backend/app/utils/docx_parser.py +++ b/backend/app/utils/docx_parser.py @@ -1,17 +1,10 @@ from __future__ import annotations -from typing import Optional -Document = None - - -def _ensure_docx_imported(): - global Document - if Document is None: - try: - from docx import Document as _Doc # type: ignore - Document = _Doc - except Exception as exc: # pragma: no cover - missing optional dep - raise ValueError("DOCX library is not installed") from exc +try: + from docx import Document as _Doc + Document = _Doc +except Exception: + Document = None def parse_docx(file_path: str) -> str: @@ -23,9 +16,9 @@ def parse_docx(file_path: str) -> str: Raises: ValueError: If the file is not a valid DOCX document or cannot be read. """ + if Document is None: + raise ValueError("DOCX library is not installed") try: - _ensure_docx_imported() - assert Document is not None doc = Document(file_path) except Exception as exc: # pragma: no cover - surface invalid DOCX raise ValueError(f"Invalid DOCX file: {exc}") from exc diff --git a/backend/app/utils/pdf_parser.py b/backend/app/utils/pdf_parser.py index 86908c2..d9001f7 100644 --- a/backend/app/utils/pdf_parser.py +++ b/backend/app/utils/pdf_parser.py @@ -1,6 +1,3 @@ -from __future__ import annotations - -from typing import Optional from pypdf import PdfReader