@@ -25,7 +25,7 @@ RUN apt-get -qq -y update \
2525 libtiff5-dev libjpeg-dev libfreetype6-dev libwebp-dev \
2626 libtiff-tools ghostscript librsvg2-bin jbig2dec \
2727 pst-utils \
28- # ## tesseract
28+ # ## tesseract
2929 tesseract-ocr-eng \
3030 tesseract-ocr-swa \
3131 tesseract-ocr-swe \
@@ -96,7 +96,7 @@ RUN apt-get -qq -y update \
9696 tesseract-ocr-aze \
9797 tesseract-ocr-bel \
9898 tesseract-ocr-uzb \
99- # ## pdf convert: libreoffice + a bunch of fonts
99+ # ## pdf convert: libreoffice + a bunch of fonts
100100 libreoffice fonts-opensymbol hyphen-fr hyphen-de \
101101 hyphen-en-us hyphen-it hyphen-ru fonts-dejavu fonts-dejavu-core fonts-dejavu-extra \
102102 fonts-droid-fallback fonts-dustin fonts-f500 fonts-fanwood fonts-freefont-ttf \
@@ -126,7 +126,7 @@ RUN mkdir /models/ && \
126126COPY requirements.txt /tmp/
127127RUN pip3 install --no-cache-dir --prefer-binary --upgrade pip
128128RUN pip3 install --no-cache-dir --prefer-binary --upgrade setuptools wheel
129- RUN pip3 install --no-cache-dir --prefer-binary -r /tmp/requirements.txt
129+ RUN pip3 install --no-cache-dir --no-binary "tesserocr" -r /tmp/requirements.txt
130130
131131# Install spaCy models
132132RUN python3 -m spacy download en_core_web_sm \
@@ -136,7 +136,7 @@ RUN python3 -m spacy download en_core_web_sm \
136136RUN python3 -m spacy download ru_core_news_sm \
137137 && python3 -m spacy download pt_core_news_sm \
138138 && python3 -m spacy download ro_core_news_sm \
139- && python3 -m spacy download mk_core_news_sm
139+ && python3 -m spacy download mk_core_news_sm
140140RUN python3 -m spacy download el_core_news_sm \
141141 && python3 -m spacy download pl_core_news_sm \
142142 && python3 -m spacy download it_core_news_sm \
0 commit comments