Skip to content
Snippets Groups Projects
Commit ed867d95 authored by Dominik Schachten's avatar Dominik Schachten
Browse files

Update Dockerfile

parent 50bf8778
No related branches found
No related tags found
No related merge requests found
Pipeline #
# OCR image: extends the upstream OCRmyPDF image with the German Tesseract
# language data, the jbig2enc encoder and scantailor.
# NOTE(review): the base image is untagged and therefore resolves to :latest;
# pin a specific tag or digest once the intended version is confirmed.
FROM jbarlow83/ocrmypdf

# The locale has to be set with ENV: a variable exported inside a RUN only
# exists for that single build step and never reaches later steps or the
# running container.
ENV LC_ALL=C.UTF-8 \
    LANG=C.UTF-8

# Refresh the package index and install every OS package in one layer so the
# install never runs against a stale cached index. The index files are removed
# in the same layer so they do not end up in the image.
# Recommended packages are still installed on purpose (wget/git rely on
# ca-certificates being pulled in for the HTTPS downloads below).
RUN apt-get -yq update \
 && apt-get -yq install \
        automake \
        autotools-dev \
        exempi \
        ghostscript \
        git \
        libleptonica-dev \
        libtool \
        pngquant \
        python3 \
        python3-pip \
        qpdf \
        scantailor \
        tesseract-ocr \
        tesseract-ocr-deu \
        unpaper \
        wget \
        zlib1g \
        zlib1g-dev \
        zlibc \
 && rm -rf /var/lib/apt/lists/*

# NOTE(review): ocrmypdf is unpinned, so rebuilds may pick up a newer release.
RUN pip3 install --no-cache-dir ocrmypdf

# Build and install jbig2enc from source. The checkout lives in /tmp and is
# deleted in the same layer, so only the installed artifacts stay in the image.
RUN git clone https://github.com/agl/jbig2enc /tmp/jbig2enc \
 && cd /tmp/jbig2enc \
 && ./autogen.sh \
 && ./configure \
 && make \
 && make install \
 && cd / \
 && rm -rf /tmp/jbig2enc

# Replace the packaged German model with the tessdata_best variant.
# The URL is quoted because '?' is a shell glob character, and -O writes the
# file straight to its final location instead of renaming it in a second layer.
RUN wget -O /usr/share/tesseract-ocr/4.00/tessdata/deu.traineddata \
        "https://github.com/tesseract-ocr/tessdata_best/blob/master/deu.traineddata?raw=true"
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment