mirror of
https://github.com/infiniflow/ragflow.git
synced 2026-06-29 15:31:05 +08:00
Fix: upgrade Apache Tika from 3.2.3 to 3.3.0 to address GHSA-72hv-8253-57qq (#13769)
### What problem does this PR solve? Upgrades Apache Tika from 3.2.3 to 3.3.0 to address the security vulnerability GHSA-72hv-8253-57qq (TIKA-4687). Closes #13601 ### Type of change - [x] Bug Fix (non-breaking change which fixes an issue) ### Changes - `Dockerfile`: Updated tika JAR filename and `TIKA_SERVER_JAR` env var from 3.2.3 to 3.3.0 - `Dockerfile.deps`: Updated tika JAR filename in COPY instruction from 3.2.3 to 3.3.0 - `download_deps.py`: Updated both Maven Central and Huawei Cloud mirror download URLs from 3.2.3 to 3.3.0 ### References - Apache Tika 3.3.0 release: https://www.apache.org/dyn/closer.lua/tika/3.3.0/tika-app-3.3.0.jar - TIKA-4687: https://issues.apache.org/jira/browse/TIKA-4687 - GHSA-72hv-8253-57qq
This commit is contained in:
committed by
GitHub
parent
3e787b3b09
commit
5ece2d8aa8
@@ -19,16 +19,16 @@ RUN --mount=type=bind,from=infiniflow/ragflow_deps:latest,source=/huggingface.co
|
||||
# This is the only way to run python-tika without internet access. Without this set, the default is to check the tika version and pull latest every time from Apache.
|
||||
RUN --mount=type=bind,from=infiniflow/ragflow_deps:latest,source=/,target=/deps \
|
||||
cp -r /deps/nltk_data /root/ && \
|
||||
cp /deps/tika-server-standard-3.2.3.jar /deps/tika-server-standard-3.2.3.jar.md5 /ragflow/ && \
|
||||
cp /deps/tika-server-standard-3.3.0.jar /deps/tika-server-standard-3.3.0.jar.md5 /ragflow/ && \
|
||||
cp /deps/cl100k_base.tiktoken /ragflow/9b5ad71b2ce5302211f9c61530b329a4922fc6a4
|
||||
|
||||
ENV TIKA_SERVER_JAR="file:///ragflow/tika-server-standard-3.2.3.jar"
|
||||
ENV TIKA_SERVER_JAR="file:///ragflow/tika-server-standard-3.3.0.jar"
|
||||
ENV DEBIAN_FRONTEND=noninteractive
|
||||
|
||||
# Setup apt
|
||||
# Python package and implicit dependencies:
|
||||
# opencv-python: libglib2.0-0 libglx-mesa0 libgl1
|
||||
# python-pptx: default-jdk tika-server-standard-3.2.3.jar
|
||||
# python-pptx: default-jdk tika-server-standard-3.3.0.jar
|
||||
# selenium: libatk-bridge2.0-0 chrome-linux64-121-0-6167-85
|
||||
# Building C extensions: libpython3-dev libgtk-4-1 libnss3 xdg-utils libgbm-dev
|
||||
RUN --mount=type=cache,id=ragflow_apt,target=/var/cache/apt,sharing=locked \
|
||||
|
||||
Reference in New Issue
Block a user