tesseract/ccmain/matmatch.cpp

397 lines
11 KiB
C++
Raw Normal View History

/**********************************************************************
* File: matmatch.cpp (Formerly matrix_match.c)
* Description: matrix matching routines for Tessedit
* Author: Chris Newton
* Created: Wed Nov 24 15:57:41 GMT 1993
*
* (C) Copyright 1993, Hewlett-Packard Ltd.
** Licensed under the Apache License, Version 2.0 (the "License");
** you may not use this file except in compliance with the License.
** You may obtain a copy of the License at
** http://www.apache.org/licenses/LICENSE-2.0
** Unless required by applicable law or agreed to in writing, software
** distributed under the License is distributed on an "AS IS" BASIS,
** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
** See the License for the specific language governing permissions and
** limitations under the License.
*
**********************************************************************/
#include "mfcpch.h"
// Include automatically generated configuration file if running autoconf.
#ifdef HAVE_CONFIG_H
#include "config_auto.h"
#endif
#include <stdlib.h>
#include <math.h>
#include <string.h>
#include <ctype.h>
#ifdef __UNIX__
#include <assert.h>
#endif
#include "tessvars.h"
#include "stderr.h"
#include "img.h"
//#include "evnts.h"
//#include "showim.h"
#include "hosthplb.h"
#include "scrollview.h"
//#include "evnts.h"
#include "adaptions.h"
#include "matmatch.h"
#include "secname.h"
#include "svshowim.h"
#define EXTERN
EXTERN BOOL_VAR (tessedit_display_mm, FALSE, "Display matrix matches");
EXTERN BOOL_VAR (tessedit_mm_debug, FALSE,
"Print debug information for matrix matcher");
EXTERN INT_VAR (tessedit_mm_prototype_min_size, 3,
"Smallest number of samples in a cluster for a prototype to be used");
// Colours for displaying the match
#define BB_COLOUR 0
#define BW_COLOUR 1
#define WB_COLOUR 3
#define UB_COLOUR 5
#define BU_COLOUR 7
#define UU_COLOUR 9
#define WU_COLOUR 11
#define UW_COLOUR 13
#define WW_COLOUR 15
#define BINIM_BLACK 0
#define BINIM_WHITE 1
float matrix_match( // returns match score
IMAGE *image1,
IMAGE *image2) {
ASSERT_HOST (image1->get_bpp () == 1 && image2->get_bpp () == 1);
if (image1->get_xsize () >= image2->get_xsize ())
return match1 (image1, image2);
else
return match1 (image2, image1);
}
float match1( /* returns match score */
IMAGE *image_w,
IMAGE *image_n) {
inT32 x_offset;
inT32 y_offset;
inT32 x_size = image_w->get_xsize ();
inT32 y_size;
inT32 x_size2 = image_n->get_xsize ();
inT32 y_size2;
IMAGE match_image;
IMAGELINE imline_w;
IMAGELINE imline_n;
IMAGELINE match_imline;
inT32 x;
inT32 y;
float sum = 0.0;
x_offset = (image_w->get_xsize () - image_n->get_xsize ()) / 2;
ASSERT_HOST (x_offset >= 0);
match_imline.init (x_size);
sum = 0;
if (image_w->get_ysize () < image_n->get_ysize ()) {
y_size = image_n->get_ysize ();
y_size2 = image_w->get_ysize ();
y_offset = (y_size - y_size2) / 2;
if (tessedit_display_mm && !tessedit_mm_use_prototypes)
tprintf ("I1 (%d, %d), I2 (%d, %d), MI (%d, %d)\n", x_size,
image_w->get_ysize (), x_size2, image_n->get_ysize (),
x_size, y_size);
match_image.create (x_size, y_size, 4);
for (y = 0; y < y_offset; y++) {
image_n->fast_get_line (0, y, x_size2, &imline_n);
for (x = 0; x < x_size2; x++) {
if (imline_n.pixels[x] == BINIM_BLACK) {
sum += -1;
match_imline.pixels[x] = UB_COLOUR;
}
else {
match_imline.pixels[x] = UW_COLOUR;
}
}
match_image.fast_put_line (x_offset, y, x_size2, &match_imline);
}
for (y = y_offset + y_size2; y < y_size; y++) {
image_n->fast_get_line (0, y, x_size2, &imline_n);
for (x = 0; x < x_size2; x++) {
if (imline_n.pixels[x] == BINIM_BLACK) {
sum += -1.0;
match_imline.pixels[x] = UB_COLOUR;
}
else {
match_imline.pixels[x] = UW_COLOUR;
}
}
match_image.fast_put_line (x_offset, y, x_size2, &match_imline);
}
for (y = y_offset; y < y_offset + y_size2; y++) {
image_w->fast_get_line (0, y - y_offset, x_size, &imline_w);
image_n->fast_get_line (0, y, x_size2, &imline_n);
for (x = 0; x < x_offset; x++) {
if (imline_w.pixels[x] == BINIM_BLACK) {
sum += -1.0;
match_imline.pixels[x] = BU_COLOUR;
}
else {
match_imline.pixels[x] = WU_COLOUR;
}
}
for (x = x_offset + x_size2; x < x_size; x++) {
if (imline_w.pixels[x] == BINIM_BLACK) {
sum += -1.0;
match_imline.pixels[x] = BU_COLOUR;
}
else {
match_imline.pixels[x] = WU_COLOUR;
}
}
for (x = x_offset; x < x_offset + x_size2; x++) {
if (imline_n.pixels[x - x_offset] == imline_w.pixels[x]) {
sum += 1.0;
if (imline_w.pixels[x] == BINIM_BLACK)
match_imline.pixels[x] = BB_COLOUR;
else
match_imline.pixels[x] = WW_COLOUR;
}
else {
sum += -1.0;
if (imline_w.pixels[x] == BINIM_BLACK)
match_imline.pixels[x] = BW_COLOUR;
else
match_imline.pixels[x] = WB_COLOUR;
}
}
match_image.fast_put_line (0, y, x_size, &match_imline);
}
}
else {
y_size = image_w->get_ysize ();
y_size2 = image_n->get_ysize ();
y_offset = (y_size - y_size2) / 2;
if (tessedit_display_mm && !tessedit_mm_use_prototypes)
tprintf ("I1 (%d, %d), I2 (%d, %d), MI (%d, %d)\n", x_size,
image_w->get_ysize (), x_size2, image_n->get_ysize (),
x_size, y_size);
match_image.create (x_size, y_size, 4);
for (y = 0; y < y_offset; y++) {
image_w->fast_get_line (0, y, x_size, &imline_w);
for (x = 0; x < x_size; x++) {
if (imline_w.pixels[x] == BINIM_BLACK) {
sum += -1;
match_imline.pixels[x] = BU_COLOUR;
}
else {
match_imline.pixels[x] = WU_COLOUR;
}
}
match_image.fast_put_line (0, y, x_size, &match_imline);
}
for (y = y_offset + y_size2; y < y_size; y++) {
image_w->fast_get_line (0, y, x_size, &imline_w);
for (x = 0; x < x_size; x++) {
if (imline_w.pixels[x] == BINIM_BLACK) {
sum += -1;
match_imline.pixels[x] = BU_COLOUR;
}
else {
match_imline.pixels[x] = WU_COLOUR;
}
}
match_image.fast_put_line (0, y, x_size, &match_imline);
}
for (y = y_offset; y < y_offset + y_size2; y++) {
image_w->fast_get_line (0, y, x_size, &imline_w);
image_n->fast_get_line (0, y - y_offset, x_size2, &imline_n);
for (x = 0; x < x_offset; x++) {
if (imline_w.pixels[x] == BINIM_BLACK) {
sum += -1.0;
match_imline.pixels[x] = BU_COLOUR;
}
else {
match_imline.pixels[x] = WU_COLOUR;
}
}
for (x = x_offset + x_size2; x < x_size; x++) {
if (imline_w.pixels[x] == BINIM_BLACK) {
sum += -1.0;
match_imline.pixels[x] = BU_COLOUR;
}
else {
match_imline.pixels[x] = WU_COLOUR;
}
}
for (x = x_offset; x < x_offset + x_size2; x++) {
if (imline_n.pixels[x - x_offset] == imline_w.pixels[x]) {
sum += 1.0;
if (imline_w.pixels[x] == BINIM_BLACK)
match_imline.pixels[x] = BB_COLOUR;
else
match_imline.pixels[x] = WW_COLOUR;
}
else {
sum += -1.0;
if (imline_w.pixels[x] == BINIM_BLACK)
match_imline.pixels[x] = BW_COLOUR;
else
match_imline.pixels[x] = WB_COLOUR;
}
}
match_image.fast_put_line (0, y, x_size, &match_imline);
}
}
#ifndef GRAPHICS_DISABLED
if (tessedit_display_mm && !tessedit_mm_use_prototypes) {
tprintf ("Match score %f\n", 1.0 - sum / (x_size * y_size));
display_images(image_w, image_n, &match_image);
}
#endif
if (tessedit_mm_debug)
tprintf ("Match score %f\n", 1.0 - sum / (x_size * y_size));
return (1.0 - sum / (x_size * y_size));
}
/*************************************************************************
* display_images()
*
* Show a pair of images, plus the match image
*
*************************************************************************/
#ifndef GRAPHICS_DISABLED
void display_images(IMAGE *image_w, IMAGE *image_n, IMAGE *match_image) {
ScrollView* w_im_window;
ScrollView* n_im_window;
ScrollView* match_window;
inT16 i;
w_im_window = new ScrollView("Image 1", 20, 100,
10 * image_w->get_xsize (), 10 * image_w->get_ysize (),
image_w->get_xsize (), image_w->get_ysize ());
sv_show_sub_image (image_w,
0, 0,
image_w->get_xsize (), image_w->get_ysize (),
w_im_window, 0, 0);
w_im_window->Pen(255,0,0);
for (i = 1; i < image_w->get_xsize (); i++) {
w_im_window->Line(i, 0, i, image_w->get_ysize ());
}
for (i = 1; i < image_w->get_ysize (); i++) {
w_im_window->Line(0, i, image_w->get_xsize (), i);
}
n_im_window = new ScrollView ("Image 2", 240, 100,
10 * image_n->get_xsize (), 10 * image_n->get_ysize (),
image_n->get_xsize (), image_n->get_ysize ());
sv_show_sub_image (image_n,
0, 0,
image_n->get_xsize (), image_n->get_ysize (),
n_im_window, 0, 0);
n_im_window->Pen(255,0,0);
for (i = 1; i < image_n->get_xsize (); i++) {
n_im_window->Line(i, 0, i, image_n->get_ysize ());
}
for (i = 1; i < image_n->get_ysize (); i++) {
n_im_window->Line(0, i, image_n->get_xsize (), i);
}
match_window = new ScrollView ("Match Result", 460, 100,
10 * match_image->get_xsize (), 10 * match_image->get_ysize (),
match_image->get_xsize (), match_image->get_ysize ());
match_window->Clear();
sv_show_sub_image (match_image,
0, 0,
match_image->get_xsize (), match_image->get_ysize (),
match_window, 0, 0);
match_window->Pen(255,0,0);
for (i = 1; i < match_image->get_xsize (); i++) {
match_window->Line(i, 0, i, match_image->get_ysize ());
}
for (i = 1; i < match_image->get_ysize (); i++) {
match_window->Line(0, i, match_image->get_xsize (), i);
}
SVEvent* sve = match_window->AwaitEvent(SVET_DESTROY);
delete sve;
delete w_im_window;
delete n_im_window;
delete match_window;
}
/*************************************************************************
* display_image()
*
* Show a single image
*
*************************************************************************/
ScrollView* display_image(IMAGE *image,
const char *title,
inT32 x,
inT32 y,
BOOL8 wait) {
ScrollView* im_window;
inT16 i;
im_window = new ScrollView (title, x, y,
10 * image->get_xsize (), 10 * image->get_ysize (),
image->get_xsize (), image->get_ysize ());
sv_show_sub_image (image,
0, 0,
image->get_xsize (), image->get_ysize (), im_window, 0, 0);
im_window->Pen(255,0,0);
for (i = 1; i < image->get_xsize (); i++) {
im_window->SetCursor(i, 0);
im_window->DrawTo(i, image->get_ysize());
}
for (i = 1; i < image->get_ysize (); i++) {
im_window->SetCursor(0, i);
im_window->DrawTo(image->get_xsize(),i);
}
if (wait) { delete im_window->AwaitEvent(SVET_CLICK); }
return im_window;
}
#endif