mirror of
https://github.com/tesseract-ocr/tesseract.git
synced 2025-01-06 01:07:49 +08:00
1c7e00611b
This requires libarchive-dev.

Tesseract can now load traineddata files in any of the archive formats
which are supported by libarchive.

Example of a zipped BagIt archive:

    $ unzip -l /usr/local/share/tessdata/zip.traineddata
    Archive:  /usr/local/share/tessdata/zip.traineddata
      Length      Date    Time    Name
    ---------  ---------- -----   ----
           55  2019-03-05 15:27   bagit.txt
            0  2019-03-05 15:25   data/
         1557  2019-03-05 15:28   manifest-sha256.txt
      1082890  2019-03-05 15:25   data/eng.word-dawg
      1487588  2019-03-05 15:25   data/eng.lstm
         7477  2019-03-05 15:25   data/eng.unicharset
        63346  2019-03-05 15:25   data/eng.shapetable
       976552  2019-03-05 15:25   data/eng.inttemp
        13408  2019-03-05 15:25   data/eng.normproto
         4322  2019-03-05 15:25   data/eng.punc-dawg
         4738  2019-03-05 15:25   data/eng.lstm-number-dawg
         1410  2019-03-05 15:25   data/eng.freq-dawg
          844  2019-03-05 15:25   data/eng.pffmtable
         6360  2019-03-05 15:25   data/eng.lstm-unicharset
         1012  2019-03-05 15:25   data/eng.lstm-recoder
         1047  2019-03-05 15:25   data/eng.unicharambigs
         4322  2019-03-05 15:25   data/eng.lstm-punc-dawg
     16109842  2019-03-05 15:25   data/eng.bigram-dawg
           80  2019-03-05 15:25   data/eng.version
         6426  2019-03-05 15:25   data/eng.number-dawg
      3694794  2019-03-05 15:25   data/eng.lstm-word-dawg
    ---------                     -------
     23468070                     21 files

`combine_tessdata -d` and `combine_tessdata -u` also work.

The traineddata files in the new format can be generated with
standard tools like zip or tar.

More work is needed for other training tools and big endian support.

Signed-off-by: Stefan Weil <sw@weilnetz.de>
57 lines
1.3 KiB
YAML
57 lines
1.3 KiB
YAML
# Travis CI configuration for Tesseract

# Build the project with Travis' C++ language support.
language: cpp

# Ubuntu release requested for the Linux build image.
dist: trusty

# Leptonica release to fetch and build. $LEPT_VER is referenced by the
# cache, install and script sections of this file.
env:
  - LEPT_VER=1.77.0

# Do not send e-mail notifications about build results.
notifications:
  email: false

# Request a build environment without sudo.
sudo: false

# Operating systems to build on; one job is created per entry.
os:
  - linux
  - osx

# APT packages installed before the build.
addons:
  apt:
    # No extra package sources are enabled. The explicit empty list avoids
    # a bare `sources:` key, which would parse as null.
    # Disabled entry: ubuntu-toolchain-r-test
    sources: []
    packages:
      # Needed to load traineddata files stored in archive formats.
      - libarchive-dev
      #- g++-6

# Disabled job matrix (kept for reference):
#matrix:
#  include:
#    - os: osx
#      install:
#      script: brew install tesseract --HEAD
#      cache:
#        directories:
#          - $HOME/Library/Caches/Homebrew
#  allow_failures:
#    - script: brew install tesseract --HEAD

# Cache the Leptonica tree (sources, build and install output all live
# under this directory) so the install steps can skip work that is
# already done.
cache:
  directories:
    - leptonica-$LEPT_VER

# Set a shell flag (LINUX or OSX) according to the worker's operating system.
before_install:
  - if [[ $TRAVIS_OS_NAME == linux ]]; then LINUX=true; fi
  - if [[ $TRAVIS_OS_NAME == osx ]]; then OSX=true; fi

# Download, configure and install Leptonica into leptonica-$LEPT_VER/usr.
# Each step runs only when the path it checks for is missing.
install:
  #- if [[ $LINUX && "$CXX" = "g++" ]]; then export CXX="g++-6" CC="gcc-6"; fi
  # Download and unpack the release tarball unless the sources are present.
  - if test ! -d leptonica-$LEPT_VER/src; then curl -Ls https://github.com/DanBloomberg/leptonica/archive/$LEPT_VER.tar.gz | tar -xz; fi
  # Configure an out-of-source build unless the install prefix already exists.
  - if test ! -d leptonica-$LEPT_VER/usr; then cmake -Hleptonica-$LEPT_VER -Bleptonica-$LEPT_VER/build -DCMAKE_INSTALL_PREFIX=leptonica-$LEPT_VER/usr; fi
  # Build and install unless the shared library is already installed.
  - if test ! -e leptonica-$LEPT_VER/usr/lib/libleptonica.so; then make -C leptonica-$LEPT_VER/build install; fi

# Configure and build Tesseract with CMake in a separate build directory,
# pointing it at the Leptonica build tree prepared by the install steps.
script:
  - mkdir build
  - cd build
  # NOTE(review): Leptonica_DIR is a relative path although cmake runs from
  # build/; presumably CMake resolves it against the source directory - confirm.
  - cmake .. -DLeptonica_DIR=leptonica-$LEPT_VER/build -DCPPAN_BUILD=OFF
  - make