# HG changeset patch # User Oleksandr Gavenko # Date 1323773558 -7200 # Node ID 8d9c9a102827b3d84102a614712c5b2c9a9229f5 # Parent d98ac8df0e854581a4116d29c43875708e0c1f00 About OCR program. diff -r d98ac8df0e85 -r 8d9c9a102827 ocr.rst --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/ocr.rst Tue Dec 13 12:52:38 2011 +0200 @@ -0,0 +1,49 @@ + +====== + OCR. +====== + +gocr. +===== + + $ gocr $IN.pnm >$OUT.txt + +ocrfeeder. +========== + +Document layout analysis and optical character recognition system:: + + $ sudo apt-get install ocrfeeder + +Using:: + + $ ocrfeeder-cli --o $OUTDIR --format HTML --images $IN.pnm + +tesseract. +========== + +Installing:: + + $ sudo apt-get install tesseract-ocr + +Using:: + + $ tesseract $IN.tif $OUT + $ cat $OUT.txt + +ocropus. +======== + + $ ocropus hocr-to-text screen.ppm + +ocrad +===== + +Optical Character Recognition program:: + + $ sudo apt-get install ocrad + +Misc. +===== + +unpapper