Full-text search for documents

Optional full-text search for documents using Elasticsearch.
Text is extracted from PDFs, and from images via OCR.
This commit is contained in:
j 2019-11-17 13:02:12 +01:00
commit fe023c2f97
6 changed files with 102 additions and 2 deletions

View file

@ -91,6 +91,7 @@ apt-get install -y \
python3-lxml \
python3-html5lib \
python3-ox \
python3-elasticsearch \
oxframe \
ffmpeg \
mkvtoolnix \
@ -98,6 +99,8 @@ apt-get install -y \
imagemagick \
poppler-utils \
ipython3 \
tesseract-ocr \
tesseract-ocr-eng \
postfix \
postgresql-client $EXTRA