mirror of
https://github.com/tesseract-ocr/tesseract.git
synced 2025-01-06 01:07:49 +08:00
425d593ebe
git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk/trunk@2 d0cd1f9f-072b-0410-8dd7-cf729c803f20
263 lines
8.8 KiB
C++
263 lines
8.8 KiB
C++
/**********************************************************************
 * File:        ratngs.cpp  (Formerly ratings.c)
 * Description: Code to manipulate the BLOB_CHOICE and WERD_CHOICE classes.
 * Author:      Ray Smith
 * Created:     Thu Apr 23 13:23:29 BST 1992
 *
 * (C) Copyright 1992, Hewlett-Packard Ltd.
 ** Licensed under the Apache License, Version 2.0 (the "License");
 ** you may not use this file except in compliance with the License.
 ** You may obtain a copy of the License at
 ** http://www.apache.org/licenses/LICENSE-2.0
 ** Unless required by applicable law or agreed to in writing, software
 ** distributed under the License is distributed on an "AS IS" BASIS,
 ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 ** See the License for the specific language governing permissions and
 ** limitations under the License.
 *
 **********************************************************************/
|
|
|
|
#include "mfcpch.h"
|
|
//#include "ipeerr.h"
|
|
#include "callcpp.h"
|
|
#include "ratngs.h"
|
|
//#include "tordvars.h"
|
|
//Stream that print_ratings_info() writes its summary line to.
//Only declared here; the definition is not in this file.
extern FILE *matcher_fp;
|
|
|
|
//List macros applied to the choice types handled in this file.
//NOTE(review): presumably these expand to the out-of-line list support
//code for each type - confirm against the header defining ELISTIZE/CLISTIZE.
ELISTIZE (BLOB_CHOICE) CLISTIZE (BLOB_CHOICE_LIST) CLISTIZE (WERD_CHOICE)
|
|
//extern FILE* matcher_fp;
|
|
/**********************************************************************
|
|
* BLOB_CHOICE::BLOB_CHOICE
|
|
*
|
|
* Constructor to build a BLOB_CHOICE from a char, rating and certainty.
|
|
**********************************************************************/
|
|
BLOB_CHOICE::BLOB_CHOICE( //constructor
|
|
char src_class, //character
|
|
float src_rating, //rating
|
|
float src_cert, //certainty
|
|
INT8 src_config //config (font)
|
|
) {
|
|
blob_class = src_class;
|
|
blob_rating = src_rating;
|
|
blob_certainty = src_cert; //just copy them
|
|
blob_config = src_config;
|
|
}
|
|
|
|
|
|
/**********************************************************************
|
|
* WERD_CHOICE::WERD_CHOICE
|
|
*
|
|
* Constructor to build a WERD_CHOICE from a char, rating and certainty.
|
|
**********************************************************************/
|
|
|
|
WERD_CHOICE::WERD_CHOICE (
|
|
//constructor
|
|
const char *src_string, //word string
|
|
float src_rating, //rating
|
|
float src_cert, //certainty
|
|
UINT8 src_permuter //permuter code
|
|
):
|
|
word_string(src_string) {
|
|
word_rating = src_rating;
|
|
word_certainty = src_cert;
|
|
word_permuter = src_permuter; //just copy them
|
|
}
|
|
|
|
|
|
/**********************************************************************
|
|
* WERD_CHOICE::operator+=
|
|
*
|
|
* Cat a second word rating on the end of this current one.
|
|
* The ratings are added and the confidence is the min.
|
|
* If the permuters are NOT the same the permuter is set to COMPOUND_PERM
|
|
**********************************************************************/
|
|
|
|
//add one on
|
|
WERD_CHOICE & WERD_CHOICE::operator+= (
|
|
const WERD_CHOICE & second //second word
|
|
) {
|
|
if (word_string.length () == 0 || second.word_string.length () == 0) {
|
|
word_string = NULL; //make it empty
|
|
}
|
|
else {
|
|
//add ratings
|
|
word_rating += second.word_rating;
|
|
if (second.word_certainty < word_certainty)
|
|
//take min
|
|
word_certainty = second.word_certainty;
|
|
//cat strings
|
|
word_string += second.word_string;
|
|
if (second.word_permuter != word_permuter)
|
|
word_permuter = COMPOUND_PERM;
|
|
}
|
|
|
|
return *this;
|
|
}
|
|
|
|
|
|
/**********************************************************************
|
|
* print_ratings_list
|
|
*
|
|
* Send all the ratings out to the logfile.
|
|
**********************************************************************/
|
|
|
|
void print_ratings_list( //print whole list
|
|
const char *msg, //intro message
|
|
BLOB_CHOICE_LIST *ratings //list of results
|
|
) {
|
|
BLOB_CHOICE_IT
|
|
c_it = ratings; //iterator
|
|
|
|
switch (ratings->length ()) {
|
|
case 0:
|
|
tprintf ("%s:<none>", msg);
|
|
break;
|
|
case 1:
|
|
tprintf ("%s:%c/%g/%g", msg,
|
|
c_it.data ()->char_class (),
|
|
c_it.data ()->rating (), c_it.data ()->certainty ());
|
|
break;
|
|
case 2:
|
|
tprintf ("%s:%c/%g/%g %c/%g/%g", msg,
|
|
c_it.data ()->char_class (),
|
|
c_it.data ()->rating (),
|
|
c_it.data ()->certainty (),
|
|
c_it.data_relative (1)->char_class (),
|
|
c_it.data_relative (1)->rating (),
|
|
c_it.data_relative (1)->certainty ());
|
|
break;
|
|
case 3:
|
|
tprintf ("%s:%c/%g/%g %c/%g/%g %c/%g/%g", msg,
|
|
c_it.data ()->char_class (),
|
|
c_it.data ()->rating (),
|
|
c_it.data ()->certainty (),
|
|
c_it.data_relative (1)->char_class (),
|
|
c_it.data_relative (1)->rating (),
|
|
c_it.data_relative (1)->certainty (),
|
|
c_it.data_relative (2)->char_class (),
|
|
c_it.data_relative (2)->rating (),
|
|
c_it.data_relative (2)->certainty ());
|
|
break;
|
|
case 4:
|
|
tprintf ("%s:%c/%g/%g %c/%g/%g %c/%g/%g %c/%g/%g", msg,
|
|
c_it.data ()->char_class (),
|
|
c_it.data ()->rating (),
|
|
c_it.data ()->certainty (),
|
|
c_it.data_relative (1)->char_class (),
|
|
c_it.data_relative (1)->rating (),
|
|
c_it.data_relative (1)->certainty (),
|
|
c_it.data_relative (2)->char_class (),
|
|
c_it.data_relative (2)->rating (),
|
|
c_it.data_relative (2)->certainty (),
|
|
c_it.data_relative (3)->char_class (),
|
|
c_it.data_relative (3)->rating (),
|
|
c_it.data_relative (3)->certainty ());
|
|
break;
|
|
default:
|
|
tprintf ("%s:%c/%g/%g %c/%g/%g %c/%g/%g %c/%g/%g %c/%g/%g", msg,
|
|
c_it.data ()->char_class (),
|
|
c_it.data ()->rating (),
|
|
c_it.data ()->certainty (),
|
|
c_it.data_relative (1)->char_class (),
|
|
c_it.data_relative (1)->rating (),
|
|
c_it.data_relative (1)->certainty (),
|
|
c_it.data_relative (2)->char_class (),
|
|
c_it.data_relative (2)->rating (),
|
|
c_it.data_relative (2)->certainty (),
|
|
c_it.data_relative (3)->char_class (),
|
|
c_it.data_relative (3)->rating (),
|
|
c_it.data_relative (3)->certainty (),
|
|
c_it.data_relative (4)->char_class (),
|
|
c_it.data_relative (4)->rating (),
|
|
c_it.data_relative (4)->certainty ());
|
|
c_it.forward ();
|
|
c_it.forward ();
|
|
c_it.forward ();
|
|
c_it.forward ();
|
|
while (!c_it.at_last ()) {
|
|
c_it.forward ();
|
|
tprintf ("%c/%g/%g",
|
|
c_it.data ()->char_class (),
|
|
c_it.data ()->rating (), c_it.data ()->certainty ());
|
|
}
|
|
|
|
break;
|
|
}
|
|
}
|
|
|
|
|
|
/**********************************************************************
|
|
* print_ratings_info
|
|
*
|
|
* Send all the ratings out to the logfile.
|
|
**********************************************************************/
|
|
|
|
void print_ratings_info( //print summary info
|
|
FILE *fp, //file to use
|
|
BLOB_CHOICE_LIST *ratings //list of results
|
|
) {
|
|
INT32
|
|
index; //to list
|
|
INT32
|
|
best_index; //to list
|
|
FLOAT32
|
|
best_rat; //rating
|
|
FLOAT32
|
|
best_cert; //certainty
|
|
char
|
|
first_char; //character
|
|
FLOAT32
|
|
first_rat; //rating
|
|
FLOAT32
|
|
first_cert; //certainty
|
|
char
|
|
sec_char = 0; //character
|
|
FLOAT32
|
|
sec_rat = 0.0f; //rating
|
|
FLOAT32
|
|
sec_cert = 0.0f; //certainty
|
|
BLOB_CHOICE_IT
|
|
c_it = ratings; //iterator
|
|
|
|
index = ratings->length ();
|
|
if (index > 0) {
|
|
first_char = c_it.data ()->char_class ();
|
|
first_rat = c_it.data ()->rating ();
|
|
first_cert = -c_it.data ()->certainty ();
|
|
if (index > 1) {
|
|
sec_char = c_it.data_relative (1)->char_class ();
|
|
sec_rat = c_it.data_relative (1)->rating ();
|
|
sec_cert = -c_it.data_relative (1)->certainty ();
|
|
}
|
|
else {
|
|
sec_char = '~';
|
|
sec_rat = -1;
|
|
sec_cert = -1;
|
|
}
|
|
}
|
|
else {
|
|
first_char = '~';
|
|
first_rat = -1;
|
|
first_cert = -1;
|
|
}
|
|
best_index = -1;
|
|
best_rat = -1;
|
|
best_cert = -1;
|
|
for (index = 0, c_it.mark_cycle_pt (); !c_it.cycled_list ();
|
|
c_it.forward (), index++) {
|
|
if (c_it.data ()->char_class () == blob_answer) {
|
|
best_index = index;
|
|
best_rat = c_it.data ()->rating ();
|
|
best_cert = -c_it.data ()->certainty ();
|
|
}
|
|
}
|
|
if (first_char == '\0' || first_char == ' ')
|
|
first_char = '~';
|
|
if (sec_char == '\0' || sec_char == ' ')
|
|
sec_char = '~';
|
|
fprintf (matcher_fp,
|
|
" " INT32FORMAT " " INT32FORMAT " %g %g %c %g %g %c %g %g\n",
|
|
ratings->length (), best_index, best_rat, best_cert, first_char,
|
|
first_rat, first_cert, sec_char, sec_rat, sec_cert);
|
|
}
|