From 9397522a2535257953d7bb190e937892b20ba197 Mon Sep 17 00:00:00 2001 From: Zaili Wang <109502517+ZailiWang@users.noreply.github.com> Date: Wed, 21 Aug 2024 22:10:59 +0800 Subject: [PATCH] Add dependency for pdf2image and OCR processing (#421) --- comps/dataprep/redis/langchain/docker/Dockerfile | 4 +++- comps/dataprep/redis/langchain_ray/docker/Dockerfile | 4 +++- comps/dataprep/redis/llama_index/docker/Dockerfile | 4 +++- 3 files changed, 9 insertions(+), 3 deletions(-) diff --git a/comps/dataprep/redis/langchain/docker/Dockerfile b/comps/dataprep/redis/langchain/docker/Dockerfile index f7fcff5a7..046524491 100644 --- a/comps/dataprep/redis/langchain/docker/Dockerfile +++ b/comps/dataprep/redis/langchain/docker/Dockerfile @@ -13,7 +13,9 @@ RUN apt-get update -y && apt-get install -y --no-install-recommends --fix-missin libgl1-mesa-glx \ libjemalloc-dev \ default-jre \ - vim + vim \ + poppler-utils \ + tesseract-ocr RUN useradd -m -s /bin/bash user && \ mkdir -p /home/user && \ diff --git a/comps/dataprep/redis/langchain_ray/docker/Dockerfile b/comps/dataprep/redis/langchain_ray/docker/Dockerfile index e5c27cb34..f9f91521f 100644 --- a/comps/dataprep/redis/langchain_ray/docker/Dockerfile +++ b/comps/dataprep/redis/langchain_ray/docker/Dockerfile @@ -13,7 +13,9 @@ RUN apt-get update -y && apt-get install -y --no-install-recommends --fix-missin libgl1-mesa-glx \ libjemalloc-dev \ vim \ - libcairo2 + libcairo2 \ + poppler-utils \ + tesseract-ocr RUN useradd -m -s /bin/bash user && \ mkdir -p /home/user && \ diff --git a/comps/dataprep/redis/llama_index/docker/Dockerfile b/comps/dataprep/redis/llama_index/docker/Dockerfile index 1bf0e8d4a..111bdbd0b 100644 --- a/comps/dataprep/redis/llama_index/docker/Dockerfile +++ b/comps/dataprep/redis/llama_index/docker/Dockerfile @@ -13,7 +13,9 @@ RUN apt-get update -y && apt-get install -y --no-install-recommends --fix-missin libgl1-mesa-glx \ libjemalloc-dev \ vim \ - libcairo2 + libcairo2 \ + poppler-utils \ + tesseract-ocr RUN useradd -m -s /bin/bash user && \ mkdir -p /home/user && \