feat(conversion): switch PDF input engine to pdftohtml for improved performance and reduced dependencies (#5820)

This commit is contained in:
Balázs Szücs
2026-03-02 14:55:42 +01:00
committed by GitHub
parent cfe040485b
commit 48dd4154e9
4 changed files with 173 additions and 30 deletions

View File

@@ -245,7 +245,7 @@ ENV PATH="/opt/venv/bin:$PATH"
# Build all heavy python packages here
RUN --mount=type=cache,target=/root/.cache/pip \
pip install \
weasyprint pdf2image opencv-python-headless ocrmypdf \
weasyprint pdf2image opencv-python-headless ocrmypdf \
"unoserver==${UNOSERVER_VERSION}"