mirror of
https://github.com/tesseract-ocr/tesseract.git
synced 2024-12-23 23:17:49 +08:00
fb2e23f6de
git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@41 d0cd1f9f-072b-0410-8dd7-cf729c803f20
263 lines
9.0 KiB
C++
263 lines
9.0 KiB
C++
/******************************************************************************
|
|
** Filename: outfeat.c
|
|
** Purpose: Definition of outline-features.
|
|
** Author: Dan Johnson
|
|
** History: 11/13/90, DSJ, Created.
|
|
**
|
|
** (c) Copyright Hewlett-Packard Company, 1988.
|
|
** Licensed under the Apache License, Version 2.0 (the "License");
|
|
** you may not use this file except in compliance with the License.
|
|
** You may obtain a copy of the License at
|
|
** http://www.apache.org/licenses/LICENSE-2.0
|
|
** Unless required by applicable law or agreed to in writing, software
|
|
** distributed under the License is distributed on an "AS IS" BASIS,
|
|
** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
** See the License for the specific language governing permissions and
|
|
** limitations under the License.
|
|
******************************************************************************/
|
|
/**----------------------------------------------------------------------------
|
|
Include Files and Type Defines
|
|
----------------------------------------------------------------------------**/
|
|
#include "outfeat.h"
|
|
#include "mfoutline.h"
|
|
#include "variables.h"
|
|
#include "sigmenu.h"
|
|
|
|
#include "ocrfeatures.h" //Debug
|
|
#include <stdio.h> //Debug
|
|
#include "efio.h" //Debug
|
|
//#include "christydbg.h"
|
|
|
|
/**----------------------------------------------------------------------------
|
|
Private Function Prototypes
|
|
----------------------------------------------------------------------------**/
|
|
/*
|
|
#if defined(__STDC__) || defined(__cplusplus)
|
|
# define _ARGS(s) s
|
|
#else
|
|
# define _ARGS(s) ()
|
|
#endif*/
|
|
|
|
/* /users/danj/wiseowl/src/danj/microfeatures/outfeat.c
|
|
void AddOutlineFeatureToSet
|
|
_ARGS((FPOINT *Start,
|
|
FPOINT *End,
|
|
FEATURE_SET FeatureSet));
|
|
|
|
void ConvertToOutlineFeatures
|
|
_ARGS((MFOUTLINE Outline,
|
|
FEATURE_SET FeatureSet));
|
|
|
|
void NormalizeOutlineX
|
|
_ARGS((FEATURE_SET FeatureSet));
|
|
|
|
#undef _ARGS
|
|
*/
|
|
/**----------------------------------------------------------------------------
|
|
Global Data Definitions and Declarations
|
|
----------------------------------------------------------------------------**/
|
|
/**----------------------------------------------------------------------------
|
|
Public Code
|
|
----------------------------------------------------------------------------**/
|
|
/*---------------------------------------------------------------------------*/
|
|
FEATURE_SET ExtractOutlineFeatures(TBLOB *Blob, LINE_STATS *LineStats) {
|
|
/*
|
|
** Parameters:
|
|
** Blob blob to extract pico-features from
|
|
** LineStats statistics on text row blob is in
|
|
** Globals: none
|
|
** Operation: Convert each segment in the outline to a feature
|
|
** and return the features.
|
|
** Return: Outline-features for Blob.
|
|
** Exceptions: none
|
|
** History: 11/13/90, DSJ, Created.
|
|
** 05/24/91, DSJ, Updated for either char or baseline normalize.
|
|
*/
|
|
LIST Outlines;
|
|
LIST RemainingOutlines;
|
|
MFOUTLINE Outline;
|
|
FEATURE_SET FeatureSet;
|
|
FLOAT32 XScale, YScale;
|
|
|
|
FeatureSet = NewFeatureSet (MAX_OUTLINE_FEATURES);
|
|
if (Blob == NULL)
|
|
return (FeatureSet);
|
|
|
|
Outlines = ConvertBlob (Blob);
|
|
|
|
NormalizeOutlines(Outlines, LineStats, &XScale, &YScale);
|
|
RemainingOutlines = Outlines;
|
|
iterate(RemainingOutlines) {
|
|
Outline = (MFOUTLINE) first_node (RemainingOutlines);
|
|
/*---------Debug--------------------------------------------------*
|
|
OFile = fopen ("f:/ims/debug/ofOutline.logCPP", "r");
|
|
if (OFile == NULL)
|
|
{
|
|
OFile = Efopen ("f:/ims/debug/ofOutline.logCPP", "w");
|
|
WriteOutline(OFile, Outline);
|
|
}
|
|
else
|
|
{
|
|
fclose (OFile);
|
|
OFile = Efopen ("f:/ims/debug/ofOutline.logCPP", "a");
|
|
}
|
|
WriteOutline(OFile, Outline);
|
|
fclose (OFile);
|
|
*--------------------------------------------------------------------*/
|
|
ConvertToOutlineFeatures(Outline, FeatureSet);
|
|
}
|
|
if (NormMethod == baseline)
|
|
NormalizeOutlineX(FeatureSet);
|
|
/*---------Debug--------------------------------------------------*
|
|
File = fopen ("f:/ims/debug/ofFeatSet.logCPP", "r");
|
|
if (File == NULL)
|
|
{
|
|
File = Efopen ("f:/ims/debug/ofFeatSet.logCPP", "w");
|
|
WriteFeatureSet(File, FeatureSet);
|
|
}
|
|
else
|
|
{
|
|
fclose (File);
|
|
File = Efopen ("f:/ims/debug/ofFeatSet.logCPP", "a");
|
|
}
|
|
WriteFeatureSet(File, FeatureSet);
|
|
fclose (File);
|
|
*--------------------------------------------------------------------*/
|
|
FreeOutlines(Outlines);
|
|
return (FeatureSet);
|
|
} /* ExtractOutlineFeatures */
|
|
|
|
|
|
/*---------------------------------------------------------------------------*/
|
|
void InitOutlineFXVars() {
|
|
//once contained a dummy
|
|
/*
|
|
** Parameters: none
|
|
** Globals: none
|
|
** Operation: Initialize the outline-feature extractor variables that can
|
|
** be tuned without recompiling.
|
|
** Return: none
|
|
** Exceptions: none
|
|
** History: 11/13/90, DSJ, Created.
|
|
*/
|
|
} /* InitOutlineFXVars */
|
|
|
|
|
|
/**----------------------------------------------------------------------------
|
|
Private Code
|
|
----------------------------------------------------------------------------**/
|
|
/*---------------------------------------------------------------------------*/
|
|
void AddOutlineFeatureToSet(FPOINT *Start,
|
|
FPOINT *End,
|
|
FEATURE_SET FeatureSet) {
|
|
/*
|
|
** Parameters:
|
|
** Start starting point of outline-feature
|
|
** End ending point of outline-feature
|
|
** FeatureSet set to add outline-feature to
|
|
** Globals: none
|
|
** Operation: This routine computes the midpoint between Start and
|
|
** End to obtain the x,y position of the outline-feature. It
|
|
** also computes the direction from Start to End as the
|
|
** direction of the outline-feature and the distance from
|
|
** Start to End as the length of the outline-feature.
|
|
** This feature is then
|
|
** inserted into the next feature slot in FeatureSet.
|
|
** Return: none (results are placed in FeatureSet)
|
|
** Exceptions: none
|
|
** History: 11/13/90, DSJ, Created.
|
|
*/
|
|
FEATURE Feature;
|
|
|
|
Feature = NewFeature (&OutlineFeatDesc);
|
|
ParamOf (Feature, OutlineFeatDir) = NormalizedAngleFrom (Start, End, 1.0);
|
|
ParamOf (Feature, OutlineFeatX) = AverageOf (Xof (*Start), Xof (*End));
|
|
ParamOf (Feature, OutlineFeatY) = AverageOf (Yof (*Start), Yof (*End));
|
|
ParamOf (Feature, OutlineFeatLength) = DistanceBetween (*Start, *End);
|
|
AddFeature(FeatureSet, Feature);
|
|
|
|
} /* AddOutlineFeatureToSet */
|
|
|
|
|
|
/*---------------------------------------------------------------------------*/
|
|
void ConvertToOutlineFeatures(MFOUTLINE Outline, FEATURE_SET FeatureSet) {
|
|
/*
|
|
** Parameters:
|
|
** Outline outline to extract outline-features from
|
|
** FeatureSet set of features to add outline-features to
|
|
** Globals: none
|
|
** Operation:
|
|
** This routine steps converts each section in the specified
|
|
** outline to a feature described by its x,y position, length
|
|
** and angle.
|
|
** Return: none (results are returned in FeatureSet)
|
|
** Exceptions: none
|
|
** History: 11/13/90, DSJ, Created.
|
|
** 5/24/91, DSJ, Added hidden edge capability.
|
|
*/
|
|
MFOUTLINE Next;
|
|
MFOUTLINE First;
|
|
FPOINT FeatureStart;
|
|
FPOINT FeatureEnd;
|
|
|
|
if (DegenerateOutline (Outline))
|
|
return;
|
|
|
|
First = Outline;
|
|
Next = First;
|
|
do {
|
|
CopyPoint (PositionOf (PointAt (Next)), FeatureStart);
|
|
Next = NextPointAfter (Next);
|
|
|
|
/* note that an edge is hidden if the ending point of the edge is
|
|
marked as hidden. This situation happens because the order of
|
|
the outlines is reversed when they are converted from the old
|
|
format. In the old format, a hidden edge is marked by the
|
|
starting point for that edge. */
|
|
if (IsVisible (PointAt (Next))) {
|
|
CopyPoint (PositionOf (PointAt (Next)), FeatureEnd);
|
|
AddOutlineFeatureToSet(&FeatureStart, &FeatureEnd, FeatureSet);
|
|
}
|
|
}
|
|
while (Next != First);
|
|
} /* ConvertToOutlineFeatures */
|
|
|
|
|
|
/*---------------------------------------------------------------------------*/
|
|
void NormalizeOutlineX(FEATURE_SET FeatureSet) {
|
|
/*
|
|
** Parameters:
|
|
** FeatureSet outline-features to be normalized
|
|
** Globals: none
|
|
** Operation: This routine computes the weighted average x position
|
|
** over all of the outline-features in FeatureSet and then
|
|
** renormalizes the outline-features to force this average
|
|
** to be the x origin (i.e. x=0).
|
|
** Return: none (FeatureSet is changed)
|
|
** Exceptions: none
|
|
** History: 11/13/90, DSJ, Created.
|
|
*/
|
|
int i;
|
|
FEATURE Feature;
|
|
FLOAT32 Length;
|
|
FLOAT32 TotalX = 0.0;
|
|
FLOAT32 TotalWeight = 0.0;
|
|
FLOAT32 Origin;
|
|
|
|
if (NumFeaturesIn (FeatureSet) <= 0)
|
|
return;
|
|
|
|
for (i = 0; i < NumFeaturesIn (FeatureSet); i++) {
|
|
Feature = FeatureIn (FeatureSet, i);
|
|
Length = ParamOf (Feature, OutlineFeatLength);
|
|
TotalX += ParamOf (Feature, OutlineFeatX) * Length;
|
|
TotalWeight += Length;
|
|
}
|
|
Origin = TotalX / TotalWeight;
|
|
|
|
for (i = 0; i < NumFeaturesIn (FeatureSet); i++) {
|
|
Feature = FeatureIn (FeatureSet, i);
|
|
ParamOf (Feature, OutlineFeatX) -= Origin;
|
|
}
|
|
} /* NormalizeOutlineX */
|