Compare commits
No commits in common. "4c6b1a936de838ffb427e54473be8952f457b2c2" and "4db0055103f5811a4f9b2d2558b56c0b78372f99" have entirely different histories.
4c6b1a936d
...
4db0055103
@ -1,3 +0,0 @@
|
|||||||
# OCR test grounds
|
|
||||||
|
|
||||||
Experimenting with open-source OCR software.
|
|
||||||
@ -1,16 +0,0 @@
|
|||||||
# Base image: Ubuntu 18.04.
FROM ubuntu:18.04

# Select the C.UTF-8 locale for every process in the image.
# Written in key=value form; the space-separated `ENV key value` form is legacy.
ENV LANG=C.UTF-8 \
    LC_ALL=C.UTF-8
|
|
||||||
|
|
||||||
# Register the alex-p/tesseract-ocr PPA. add-apt-repository is provided by
# software-properties-common, so that package is installed first.
# The apt package lists are deleted in the same layer so they are not
# persisted in the image.
RUN apt-get update \
    && apt-get install -y software-properties-common \
    && add-apt-repository -y ppa:alex-p/tesseract-ocr \
    && rm -rf /var/lib/apt/lists/*

# Install ImageMagick plus tesseract with the eng and nor language packages.
# `apt-get update` and `apt-get install` share one layer so the install never
# runs against a stale cached index; the lists are removed afterwards.
RUN apt-get update && apt-get install -y \
        imagemagick \
        tesseract-ocr \
        tesseract-ocr-eng \
        tesseract-ocr-nor \
    && rm -rf /var/lib/apt/lists/*
|
|
||||||
|
|
||||||
# Copy the ocr.sh helper script from the build context to /bin/ocr.sh.
COPY ocr.sh /bin/ocr.sh
|
|
||||||
# Add the execute bit to the helper script so it can be invoked directly.
RUN chmod +x /bin/ocr.sh
|
|
||||||
|
|
||||||
# Run tesseract as the container's main process (exec form, no shell wrapper).
# NOTE(review): /bin/ocr.sh is copied into the image but is not the entrypoint;
# presumably it is meant to be run by overriding the entrypoint — confirm.
ENTRYPOINT ["tesseract"]
|
|
||||||
@ -1,5 +0,0 @@
|
|||||||
#!/bin/sh
# Preprocess an image with ImageMagick, run tesseract on it with the "nor"
# language, and print the recognised text to stdout.
#
# Usage: ocr.sh IMAGE
#
# Intermediate files are written to fixed paths under /tmp (/tmp/image.jpg and
# /tmp/out*), so concurrent runs in the same filesystem would overwrite each
# other.

# Abort on the first failing step so tesseract never runs on a missing or
# stale /tmp/image.jpg left over from an earlier invocation.
set -e

if [ "$#" -lt 1 ]; then
    echo "usage: $0 IMAGE" >&2
    exit 2
fi

# Convert to grayscale, scale to 5000 px wide and sharpen before recognition.
# "$1" is quoted so paths containing spaces or glob characters are passed
# through as a single argument.
convert -colorspace gray -fill white -resize 5000x -sharpen 0x1 "$1" /tmp/image.jpg

# /tmp/out is the output base name; the glob below picks up whatever file(s)
# tesseract creates from it.
tesseract -l nor /tmp/image.jpg /tmp/out
cat /tmp/out*
|
|
||||||
Loading…
x
Reference in New Issue
Block a user