mirror of https://github.com/google/oss-fuzz.git
[tesseract-ocr] Add Tesseract (#2210)
* Add Tesseract
* Use -lz instead of static library path
* Disable Tesseract shared build
* Minimal repository cloning (--depth 1)
* Improve tessdata directory resolution syntax
* Don't hardcode TESSDATA_PREFIX into binary
* Don't move, but copy $SRC/tessdata to $OUT
  Move sometimes results in "inter-device move failed"
This commit is contained in:
parent
166745e25d
commit
bf5caa86c3
|
@ -0,0 +1,24 @@
|
|||
# Copyright 2019 Google Inc.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
#
|
||||
################################################################################
|
||||
|
||||
# Builder image for the Tesseract OCR fuzz targets.
FROM gcr.io/oss-fuzz-base/base-builder

# MAINTAINER is deprecated; the contact is recorded as a label instead.
LABEL maintainer="guidovranken@gmail.com"

# Autotools toolchain plus the image-format development packages used by the
# Leptonica/Tesseract build. The apt lists are removed in the same layer so
# they do not persist in the image.
RUN apt-get update && apt-get install -y \
        autoconf \
        automake \
        libjpeg8-dev \
        libpng-dev \
        libtiff5-dev \
        libtool \
        pkg-config \
        wget \
        zlib1g-dev \
    && rm -rf /var/lib/apt/lists/*

# Leptonica 1.77.0 release tarball. build.sh unpacks it from $SRC, so this
# presumably relies on the base image's working directory being $SRC.
# NOTE(review): the download is not checksum-verified.
RUN wget https://github.com/DanBloomberg/leptonica/releases/download/1.77.0/leptonica-1.77.0.tar.gz

# Shallow clones: only the latest revision of each repository is needed.
RUN git clone --depth 1 https://github.com/tesseract-ocr/tesseract
RUN git clone --depth 1 https://github.com/tesseract-ocr/tessdata
RUN git clone --depth 1 https://github.com/guidovranken/tesseract-ocr-fuzzers

COPY build.sh $SRC/
|
|
@ -0,0 +1,49 @@
|
|||
#!/bin/bash -eu
|
||||
# Copyright 2019 Google Inc.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
#
|
||||
################################################################################
|
||||
|
||||
# --- Leptonica -------------------------------------------------------------
# Unpack and build the release tarball fetched by the Dockerfile, then install
# it; the fuzzer link step below picks up /usr/local/lib/liblept.a.
cd "$SRC"
tar zxf leptonica-1.77.0.tar.gz
cd leptonica-1.77.0
./configure
make -j"$(nproc)"
make install
ldconfig

# --- Tesseract -------------------------------------------------------------
# Static-only build without the graphics component; the fuzzer links directly
# against src/api/.libs/libtesseract.a.
# NOTE(review): -D_GLIBCXX_DEBUG is applied here but not to the fuzzer compile
# below -- confirm this is intended for the standard library in use.
cd "$SRC/tesseract"
./autogen.sh
CXXFLAGS="$CXXFLAGS -D_GLIBCXX_DEBUG" ./configure --disable-graphics --disable-shared
make -j"$(nproc)"

# --- Fuzzer ----------------------------------------------------------------
cd "$SRC/tesseract-ocr-fuzzers"

# Copy (not move) the model data into $OUT; a move sometimes fails with
# "inter-device move failed".
cp -R "$SRC/tessdata" "$OUT"

# $CXX and $CXXFLAGS are deliberately left unquoted so that they word-split
# into separate compiler arguments; all path arguments are quoted.
$CXX $CXXFLAGS \
    -I "$SRC/tesseract/src/api" \
    -I "$SRC/tesseract/src/ccstruct" \
    -I "$SRC/tesseract/src/ccmain" \
    -I "$SRC/tesseract/src/ccutil" \
    "$SRC/tesseract-ocr-fuzzers/fuzzer-api.cpp" -o "$OUT/fuzzer-api" \
    "$SRC/tesseract/src/api/.libs/libtesseract.a" \
    /usr/local/lib/liblept.a \
    /usr/lib/x86_64-linux-gnu/libtiff.a \
    /usr/lib/x86_64-linux-gnu/libpng.a \
    /usr/lib/x86_64-linux-gnu/libjpeg.a \
    /usr/lib/x86_64-linux-gnu/libjbig.a \
    /usr/lib/x86_64-linux-gnu/liblzma.a \
    -lz \
    -lFuzzingEngine
|
|
@ -0,0 +1,2 @@
|
|||
# Project metadata for the Tesseract fuzzing integration.
# Upstream project page.
homepage: "https://github.com/tesseract-ocr/tesseract"
# Address of the project's primary contact.
primary_contact: "stjoweil@googlemail.com"
|
Loading…
Reference in New Issue