mirror of
https://github.com/tesseract-ocr/tesseract.git
synced 2024-11-24 19:19:05 +08:00
570af48b8b
git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@87 d0cd1f9f-072b-0410-8dd7-cf729c803f20
146 lines
4.9 KiB
C
146 lines
4.9 KiB
C
/******************************************************************************
|
|
** Filename: matchdefs.h
|
|
** Purpose: Generic interface definitions for feature matchers.
|
|
** Author: Dan Johnson
|
|
** History: Fri Jan 19 09:21:25 1990, DSJ, Created.
|
|
**
|
|
** (c) Copyright Hewlett-Packard Company, 1988.
|
|
** Licensed under the Apache License, Version 2.0 (the "License");
|
|
** you may not use this file except in compliance with the License.
|
|
** You may obtain a copy of the License at
|
|
** http://www.apache.org/licenses/LICENSE-2.0
|
|
** Unless required by applicable law or agreed to in writing, software
|
|
** distributed under the License is distributed on an "AS IS" BASIS,
|
|
** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
** See the License for the specific language governing permissions and
|
|
** limitations under the License.
|
|
******************************************************************************/
|
|
#ifndef MATCHDEFS_H
|
|
#define MATCHDEFS_H
|
|
|
|
/**----------------------------------------------------------------------------
|
|
Include Files and Type Defines
|
|
----------------------------------------------------------------------------**/
|
|
#include "general.h"
|
|
#include <stdio.h>
|
|
#include "unichar.h"
|
|
|
|
/* define the maximum number of classes defined for any matcher
|
|
and the maximum class id for any matcher. This must be changed
|
|
if more different classes need to be classified */
|
|
#define MAX_NUM_CLASSES 256
|
|
#define MAX_CLASS_ID (MAX_NUM_CLASSES - 1)
|
|
|
|
/* a CLASS_ID is the ascii character to be associated with a class */
|
|
typedef UNICHAR_ID CLASS_ID;
|
|
#define NO_CLASS (0)
|
|
|
|
/* define a type for the index (rather than the class id) of a class.
|
|
Class indexes are sequentially defined, while class id's are defined
|
|
by the ascii character set. */
|
|
typedef INT16 CLASS_INDEX;
|
|
typedef CLASS_INDEX CLASS_TO_INDEX[MAX_CLASS_ID + 1];
|
|
typedef CLASS_ID INDEX_TO_CLASS[MAX_NUM_CLASSES];
|
|
#define ILLEGAL_CLASS (-1)
|
|
|
|
/* a PROTO_ID is the index of a prototype within it's class. Valid proto
|
|
id's are 0 to N-1 where N is the number of prototypes that make up the
|
|
class. */
|
|
typedef INT16 PROTO_ID;
|
|
#define NO_PROTO (-1)
|
|
|
|
/* FEATURE_ID is the index of a feature within a character description
|
|
The feature id ranges from 0 to N-1 where N is the number
|
|
of features in a character description. */
|
|
typedef UINT8 FEATURE_ID;
|
|
#define NO_FEATURE 255
|
|
#define NOISE_FEATURE 254
|
|
#define MISSING_PROTO 254
|
|
#define MAX_NUM_FEAT 40
|
|
#define MAX_FEATURE_ID 250
|
|
|
|
/* a RATING is the match rating returned by a classifier.
|
|
Higher is better. */
|
|
typedef FLOAT32 RATING;
|
|
|
|
/* a CERTAINTY is an indication of the degree of confidence of the
|
|
classifier. Higher is better. 0 means the match is as good as the
|
|
mean of the matches seen in training. -1 means the match was one
|
|
standard deviation worse than the training matches, etc. */
|
|
typedef FLOAT32 CERTAINTY;
|
|
|
|
/* define a data structure to hold a single match result */
|
|
typedef struct
|
|
{
|
|
CLASS_ID Class;
|
|
RATING Rating;
|
|
CERTAINTY Certainty;
|
|
}
|
|
|
|
|
|
MATCH_RESULT;
|
|
|
|
/* define a data structure for holding an array of match results */
|
|
typedef MATCH_RESULT SORTED_CLASSES[MAX_CLASS_ID + 1];
|
|
|
|
/**----------------------------------------------------------------------------
|
|
Public Function Prototypes
|
|
----------------------------------------------------------------------------**/
|
|
/* all feature matchers that are to be used with the high level
|
|
classifier must support the following interface. The names will, of
|
|
course, be unique for each different matcher. Note also that
|
|
FEATURE_STRUCT is a data structure that is defined specifically for
|
|
each feature extractor/matcher pair.
|
|
|
|
void InitClassifier ();
|
|
|
|
void InitClassifierVars ();
|
|
|
|
int TweekClassifier (char *Params);
|
|
|
|
void InitQuickGuess (FEATURE_STRUCT *CharFeatures);
|
|
|
|
CLASS_ID NextQuickGuess ();
|
|
|
|
void MatchCharToClass (CLASS_ID
|
|
ClassID,
|
|
FEATURE_STRUCT
|
|
*CharFeatures,
|
|
MATCH_RESULT
|
|
*MatchResult);
|
|
|
|
void DebugMatch (CLASS_ID
|
|
ClassID,
|
|
FEATURE_STRUCT
|
|
*CharFeatures,
|
|
MATCH_RESULT
|
|
*MatchResult);
|
|
|
|
*/
|
|
|
|
/* misc test functions for proto id's and feature id's */
|
|
#define IsValidFeature(Fid) ((Fid) < MAX_FEATURE_ID)
|
|
#define IsValidProto(Pid) ((Pid) >= 0)
|
|
|
|
#if defined(__STDC__) || defined(__cplusplus)
|
|
# define _ARGS(s) s
|
|
#else
|
|
# define _ARGS(s) ()
|
|
#endif
|
|
|
|
/* matchdefs.c */
|
|
int CompareMatchResults
|
|
_ARGS ((MATCH_RESULT * Result1, MATCH_RESULT * Result2));
|
|
|
|
void PrintMatchResult _ARGS ((FILE * File, MATCH_RESULT * MatchResult));
|
|
|
|
void PrintMatchResults
|
|
_ARGS ((FILE * File, int N, MATCH_RESULT MatchResults[]));
|
|
|
|
#undef _ARGS
|
|
|
|
/**----------------------------------------------------------------------------
|
|
Global Data Definitions and Declarations
|
|
----------------------------------------------------------------------------**/
|
|
#endif
|