From bf65f15d04b5fd8fb0409d185e380e9db10772f7 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jos=C3=A9=20Guilherme=20Vanz?= Date: Wed, 2 Dec 2020 23:52:50 -0300 Subject: [PATCH] Install Tesseract dependency MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Change the Dockerfile of the container used to run the tests so that it installs the Tesseract packages (libtesseract4 and tesseract-ocr-por), which are required for the OCR to work. The Apache Tika installation step is also moved ahead of the code copy. Signed-off-by: José Guilherme Vanz --- Dockerfile | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/Dockerfile b/Dockerfile index 645faca..7b9506a 100644 --- a/Dockerfile +++ b/Dockerfile @@ -3,7 +3,11 @@ FROM python:3.8 RUN adduser --system gazette RUN apt-get update -y -RUN apt-get -y install default-jre wait-for-it +RUN apt-get -y install default-jre wait-for-it libtesseract4 tesseract-ocr-por + +# install Apache Tika +ADD http://archive.apache.org/dist/tika/tika-app-1.24.jar /tika-app.jar +RUN chmod 755 /tika-app.jar RUN mkdir /mnt/code COPY . /mnt/code @@ -12,9 +16,5 @@ ENV PYTHONPATH=/mnt/code RUN pip install --no-cache-dir -r requirements.txt -# install Apache Tika -ADD http://archive.apache.org/dist/tika/tika-app-1.24.jar /tika-app.jar -RUN chmod 755 /tika-app.jar - USER gazette