2017-08-19 21:12:06 +08:00
|
|
|
///////////////////////////////////////////////////////////////////////
|
2017-08-19 21:16:23 +08:00
|
|
|
// File: apiexample_test.cc
|
2017-08-19 21:12:06 +08:00
|
|
|
// Description: Api Example for Tesseract.
|
|
|
|
// Author: ShreeDevi Kumar
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
///////////////////////////////////////////////////////////////////////
|
|
|
|
#include "gtest/gtest.h"
|
|
|
|
#include "tesseract/baseapi.h"
|
|
|
|
#include "leptonica/allheaders.h"
|
|
|
|
#include <iostream>
|
|
|
|
#include <string>
|
|
|
|
#include <fstream>
|
|
|
|
#include <locale>
|
|
|
|
|
|
|
|
TEST(TesseractTest, ApiExample)
|
|
|
|
{
|
|
|
|
char *outText;
|
2017-08-19 21:16:23 +08:00
|
|
|
std::locale loc("en_US.UTF-8"); // You can also use "" for the default system locale
|
2017-09-04 13:14:43 +08:00
|
|
|
std::ifstream file("../testing/phototest.txt");
|
2017-08-19 21:16:23 +08:00
|
|
|
file.imbue(loc); // Use it for file input
|
2017-08-19 21:12:06 +08:00
|
|
|
std::string gtText((std::istreambuf_iterator<char>(file)),
|
|
|
|
std::istreambuf_iterator<char>());
|
2017-08-19 21:16:23 +08:00
|
|
|
|
2017-08-19 21:12:06 +08:00
|
|
|
tesseract::TessBaseAPI *api = new tesseract::TessBaseAPI();
|
2017-08-19 21:16:23 +08:00
|
|
|
// Initialize tesseract-ocr with English, without specifying tessdata path
|
2017-08-19 21:12:06 +08:00
|
|
|
if (api->Init(NULL, "eng")) {
|
|
|
|
fprintf(stderr, "Could not initialize tesseract.\n");
|
|
|
|
exit(1);
|
|
|
|
}
|
2017-08-19 21:16:23 +08:00
|
|
|
|
|
|
|
// Open input image with leptonica library
|
|
|
|
Pix *image = pixRead("../testing/phototest.tif");
|
2017-08-19 21:12:06 +08:00
|
|
|
api->SetImage(image);
|
2017-08-19 21:16:23 +08:00
|
|
|
// Get OCR result
|
2017-08-19 21:12:06 +08:00
|
|
|
outText = api->GetUTF8Text();
|
2017-08-19 21:16:23 +08:00
|
|
|
|
|
|
|
ASSERT_EQ(gtText,outText) << "Phototest.tif with default values OCR does not match ground truth";
|
|
|
|
|
|
|
|
// Destroy used object and release memory
|
2017-08-19 21:12:06 +08:00
|
|
|
api->End();
|
|
|
|
delete [] outText;
|
|
|
|
pixDestroy(&image);
|
2017-08-19 21:16:23 +08:00
|
|
|
|
2017-08-19 21:12:06 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
int main(int argc, char **argv) {
|
|
|
|
::testing::InitGoogleTest(&argc, argv);
|
|
|
|
return RUN_ALL_TESTS();
|
2017-08-19 21:16:23 +08:00
|
|
|
}
|