mirror of
https://github.com/tesseract-ocr/tesseract.git
synced 2024-12-18 11:28:51 +08:00
0e868ef377
Tha, Vie, Kan, Tel etc. There is a new overlap detector that detects when diacritics cause a big increase in textline overlap. In such cases, diacritics from overlap regions are kept separate from layout analysis completely, allowing textline formation to happen without them. The diacritics are then assigned to 0, 1 or 2 close words at the end of layout analysis, using and modifying an old noise detection data path. The stored diacritics are used or not during recognition according to the character classifier's liking for them.
43 lines
1.5 KiB
C++
43 lines
1.5 KiB
C++
/**********************************************************************
|
|
* File: tordmain.h (Formerly textordp.h)
|
|
* Description: C++ top level textord code.
|
|
* Author: Ray Smith
|
|
* Created: Tue Jul 28 17:12:33 BST 1992
|
|
*
|
|
* (C) Copyright 1992, Hewlett-Packard Ltd.
|
|
** Licensed under the Apache License, Version 2.0 (the "License");
|
|
** you may not use this file except in compliance with the License.
|
|
** You may obtain a copy of the License at
|
|
** http://www.apache.org/licenses/LICENSE-2.0
|
|
** Unless required by applicable law or agreed to in writing, software
|
|
** distributed under the License is distributed on an "AS IS" BASIS,
|
|
** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
** See the License for the specific language governing permissions and
|
|
** limitations under the License.
|
|
*
|
|
**********************************************************************/
|
|
|
|
#ifndef TORDMAIN_H
|
|
#define TORDMAIN_H
|
|
|
|
#include <time.h>
|
|
#include "params.h"
|
|
#include "ocrblock.h"
|
|
#include "blobs.h"
|
|
#include "blobbox.h"
|
|
|
|
struct Pix;
|
|
namespace tesseract {
|
|
// Forward declaration only; the class itself is defined elsewhere.
class Tesseract;
|
|
|
|
// Prototype only -- the definition is not in this header.
// Takes a pointer to an image (Pix) and a pointer to a single BLOBNBOX, and
// returns nothing.
// NOTE(review): presumably measures stroke width for `blob` using `pix` and
// records the result on the blob -- confirm against the definition.
void SetBlobStrokeWidth(Pix* pix, BLOBNBOX* blob);
|
|
// Prototype only -- the definition is not in this header.
// Takes a pointer to an image (Pix), a list of BLOCKs and a list of
// TO_BLOCKs, and returns nothing.
// NOTE(review): presumably distributes blobs among `blocks` and fills
// `port_blocks` with the corresponding TO_BLOCKs -- confirm against the
// definition, including whether `pix` may be null.
void assign_blobs_to_blocks2(Pix* pix, BLOCK_LIST *blocks,
|
|
TO_BLOCK_LIST *port_blocks);
|
|
} // namespace tesseract
|
|
|
|
// Prototype only -- the definition is not in this header. Unlike the
// declarations above, this one is at global scope, outside namespace
// tesseract.
// Takes a pointer to a ROW plus two double-valued tuning parameters, and
// returns nothing.
// NOTE(review): the parameter names suggest a cap on the baseline shift and a
// fraction of the x-height; units and valid ranges are not visible here --
// confirm against the definition.
void tweak_row_baseline(ROW *row,
|
|
double blshift_maxshift,
|
|
double blshift_xfraction);
|
|
|
|
#endif
|