- Timestamp: 2020-06-16T17:20:50+12:00 (4 years ago)
- File: 1 edited
Legend:
- Unmodified
- Added
- Removed
-
gs2-extensions/tesseract/trunk/src/packages/CASCADE-MAKE/TESSERACT.sh
--- gs2-extensions/tesseract/trunk/src/packages/CASCADE-MAKE/TESSERACT.sh (r34186)
+++ gs2-extensions/tesseract/trunk/src/packages/CASCADE-MAKE/TESSERACT.sh (r34190)
@@ -45,28 +45,26 @@
 
 echo "Installing basic tesseract languages support (tessdata)"
-cp $GEXTTESS_DEVEL/packages/tessdata-langs.tar.gz $GEXTTESS_INSTALLED/.
-pushd $GEXTTESS_INSTALLED
+# Untar OCR language support tarball one level above TESSDATA_PREFIX ($GEXTTESS_INSTALLED/shared),
+# Then go into that folder to finish setting up language files.
+cp $GEXTTESS_DEVEL/packages/tessdata-langs.tar.gz $TESSDATA_PREFIX/../.
+pushd $TESSDATA_PREFIX/..
 tar -xvzf tessdata-langs.tar.gz
+# Above creates linux/shared/tessdata-langs folder - move files there into
+# linux/shared/tessdata (i.e. TESSDATA_PREFIX) and delete both tarball and temporary
+# tessdata-langs folder created at current location of one level up from TESSDATA_PREFIX
+mv tessdata-langs/*.traineddata $TESSDATA_PREFIX/.
 rm tessdata-langs.tar.gz
-mkdir -p tessdata/tessconfigs
+rm -rf tessdata-langs
 popd
 
-# Not sure why source package's tessdata didn't get installed in installdir
-# despite exporting TESSDATA_PREFIX at the start at cascade-make process.
-cp -r $package$version/tessdata/configs $GEXTTESS_INSTALLED/tessdata/
-cp $package$version/tessdata/eng.user-patterns $GEXTTESS_INSTALLED/tessdata/.
-cp $package$version/tessdata/eng.user-words $GEXTTESS_INSTALLED/tessdata/.
-cp $package$version/tessdata/tessconfigs/*batch* $GEXTTESS_INSTALLED/tessdata/tessconfigs/.
-cp $package$version/tessdata/tessconfigs/*demo* $GEXTTESS_INSTALLED/tessdata/tessconfigs/.
 
-
-echo "Done installing basic tesseract languages"
-echo "Visit https://github.com/tesseract-ocr/tessdata for a full list of trained language data."
-echo "To download support for any specific language(s), note the 3 letter code of that language"
-echo "Go into your $GEXTTESS_INSTALLED/tessdata and for each language run: "
+echo "Done installing basic tesseract languages for OCR (Optical Character Recognition, to recognise text from images)."
+echo "Visit https://github.com/tesseract-ocr/tessdata for a full list of trained language data for OCR."
+echo "To download OCR support for any specific language(s), note the 3 letter code of that language"
+echo "Go into your $TESSDATA_PREFIX folder and for each language you want OCR abilities for, run: "
 echo " wget https://github.com/tesseract-ocr/tessdata/raw/master/<3-letter-lang-code>.traineddata"
-echo "To get all languages currently supported by Tesseract , delete"
-echo "$ GEXTTESS_INSTALLED/tessdata"
-echo "and in $GEXTTES_INSTALLED run:"
+echo "To get all languages currently supported by Tesseract (beware, this may be a few Gigabytes), delete"
+echo "$TESSDATA_PREFIX"
+echo "and in $GEXTTES_INSTALLED/shared run:"
 echo " git clone https://github.com/tesseract-ocr/tessdata"
 echo ""
Note: See TracChangeset for help on using the changeset viewer.