mirror of
https://github.com/tesseract-ocr/tesseract.git
synced 2025-01-22 09:53:03 +08:00
10c1169d98
git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@860 d0cd1f9f-072b-0410-8dd7-cf729c803f20
696 lines
26 KiB
C++
696 lines
26 KiB
C++
/**********************************************************************
|
|
* File: pithsync.cpp (Formerly pitsync2.c)
|
|
* Description: Code to find the optimum fixed pitch segmentation of some blobs.
|
|
* Author: Ray Smith
|
|
* Created: Thu Nov 19 11:48:05 GMT 1992
|
|
*
|
|
* (C) Copyright 1992, Hewlett-Packard Ltd.
|
|
** Licensed under the Apache License, Version 2.0 (the "License");
|
|
** you may not use this file except in compliance with the License.
|
|
** You may obtain a copy of the License at
|
|
** http://www.apache.org/licenses/LICENSE-2.0
|
|
** Unless required by applicable law or agreed to in writing, software
|
|
** distributed under the License is distributed on an "AS IS" BASIS,
|
|
** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
** See the License for the specific language governing permissions and
|
|
** limitations under the License.
|
|
*
|
|
**********************************************************************/
|
|
|
|
#ifdef __UNIX__
|
|
#include <assert.h>
|
|
#endif
|
|
#include <math.h>
|
|
#include "memry.h"
|
|
#include "makerow.h"
|
|
#include "pitsync1.h"
|
|
#include "topitch.h"
|
|
#include "pithsync.h"
|
|
#include "tprintf.h"
|
|
|
|
#define PROJECTION_MARGIN 10 //arbitrary
|
|
|
|
#define EXTERN
|
|
|
|
/**********************************************************************
|
|
* FPCUTPT::setup
|
|
*
|
|
* Constructor to make a new FPCUTPT.
|
|
**********************************************************************/
|
|
|
|
void FPCUTPT::setup( //constructor
|
|
FPCUTPT *cutpts, //predecessors
|
|
inT16 array_origin, //start coord
|
|
STATS *projection, //vertical occupation
|
|
inT16 zero_count, //official zero
|
|
inT16 pitch, //proposed pitch
|
|
inT16 x, //position
|
|
inT16 offset //dist to gap
|
|
) {
|
|
//half of pitch
|
|
inT16 half_pitch = pitch / 2 - 1;
|
|
uinT32 lead_flag; //new flag
|
|
inT32 ind; //current position
|
|
|
|
if (half_pitch > 31)
|
|
half_pitch = 31;
|
|
else if (half_pitch < 0)
|
|
half_pitch = 0;
|
|
lead_flag = 1 << half_pitch;
|
|
|
|
pred = NULL;
|
|
mean_sum = 0;
|
|
sq_sum = offset * offset;
|
|
cost = sq_sum;
|
|
faked = FALSE;
|
|
terminal = FALSE;
|
|
fake_count = 0;
|
|
xpos = x;
|
|
region_index = 0;
|
|
mid_cuts = 0;
|
|
if (x == array_origin) {
|
|
back_balance = 0;
|
|
fwd_balance = 0;
|
|
for (ind = 0; ind <= half_pitch; ind++) {
|
|
fwd_balance >>= 1;
|
|
if (projection->pile_count (ind) > zero_count)
|
|
fwd_balance |= lead_flag;
|
|
}
|
|
}
|
|
else {
|
|
back_balance = cutpts[x - 1 - array_origin].back_balance << 1;
|
|
back_balance &= lead_flag + lead_flag - 1;
|
|
if (projection->pile_count (x) > zero_count)
|
|
back_balance |= 1;
|
|
fwd_balance = cutpts[x - 1 - array_origin].fwd_balance >> 1;
|
|
if (projection->pile_count (x + half_pitch) > zero_count)
|
|
fwd_balance |= lead_flag;
|
|
}
|
|
}
|
|
|
|
|
|
/**********************************************************************
|
|
* FPCUTPT::assign
|
|
*
|
|
* Constructor to make a new FPCUTPT.
|
|
**********************************************************************/
|
|
|
|
void FPCUTPT::assign( //constructor
|
|
FPCUTPT *cutpts, //predecessors
|
|
inT16 array_origin, //start coord
|
|
inT16 x, //position
|
|
BOOL8 faking, //faking this one
|
|
BOOL8 mid_cut, //cheap cut.
|
|
inT16 offset, //dist to gap
|
|
STATS *projection, //vertical occupation
|
|
float projection_scale, //scaling
|
|
inT16 zero_count, //official zero
|
|
inT16 pitch, //proposed pitch
|
|
inT16 pitch_error //allowed tolerance
|
|
) {
|
|
int index; //test index
|
|
int balance_index; //for balance factor
|
|
inT16 balance_count; //ding factor
|
|
inT16 r_index; //test cut number
|
|
FPCUTPT *segpt; //segment point
|
|
inT32 dist; //from prev segment
|
|
double sq_dist; //squared distance
|
|
double mean; //mean pitch
|
|
double total; //total dists
|
|
double factor; //cost function
|
|
//half of pitch
|
|
inT16 half_pitch = pitch / 2 - 1;
|
|
uinT32 lead_flag; //new flag
|
|
|
|
if (half_pitch > 31)
|
|
half_pitch = 31;
|
|
else if (half_pitch < 0)
|
|
half_pitch = 0;
|
|
lead_flag = 1 << half_pitch;
|
|
|
|
back_balance = cutpts[x - 1 - array_origin].back_balance << 1;
|
|
back_balance &= lead_flag + lead_flag - 1;
|
|
if (projection->pile_count (x) > zero_count)
|
|
back_balance |= 1;
|
|
fwd_balance = cutpts[x - 1 - array_origin].fwd_balance >> 1;
|
|
if (projection->pile_count (x + half_pitch) > zero_count)
|
|
fwd_balance |= lead_flag;
|
|
|
|
xpos = x;
|
|
cost = MAX_FLOAT32;
|
|
pred = NULL;
|
|
faked = faking;
|
|
terminal = FALSE;
|
|
region_index = 0;
|
|
fake_count = MAX_INT16;
|
|
for (index = x - pitch - pitch_error; index <= x - pitch + pitch_error;
|
|
index++) {
|
|
if (index >= array_origin) {
|
|
segpt = &cutpts[index - array_origin];
|
|
dist = x - segpt->xpos;
|
|
if (!segpt->terminal && segpt->fake_count < MAX_INT16) {
|
|
balance_count = 0;
|
|
if (textord_balance_factor > 0) {
|
|
if (textord_fast_pitch_test) {
|
|
lead_flag = back_balance ^ segpt->fwd_balance;
|
|
balance_count = 0;
|
|
while (lead_flag != 0) {
|
|
balance_count++;
|
|
lead_flag &= lead_flag - 1;
|
|
}
|
|
}
|
|
else {
|
|
for (balance_index = 0;
|
|
index + balance_index < x - balance_index;
|
|
balance_index++)
|
|
balance_count +=
|
|
(projection->pile_count (index + balance_index) <=
|
|
zero_count) ^ (projection->pile_count (x -
|
|
balance_index)
|
|
<= zero_count);
|
|
}
|
|
balance_count =
|
|
(inT16) (balance_count * textord_balance_factor /
|
|
projection_scale);
|
|
}
|
|
r_index = segpt->region_index + 1;
|
|
total = segpt->mean_sum + dist;
|
|
balance_count += offset;
|
|
sq_dist =
|
|
dist * dist + segpt->sq_sum + balance_count * balance_count;
|
|
mean = total / r_index;
|
|
factor = mean - pitch;
|
|
factor *= factor;
|
|
factor += sq_dist / (r_index) - mean * mean;
|
|
if (factor < cost && segpt->fake_count + faked <= fake_count) {
|
|
cost = factor; //find least cost
|
|
pred = segpt; //save path
|
|
mean_sum = total;
|
|
sq_sum = sq_dist;
|
|
fake_count = segpt->fake_count + faked;
|
|
mid_cuts = segpt->mid_cuts + mid_cut;
|
|
region_index = r_index;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
/**********************************************************************
|
|
* FPCUTPT::assign_cheap
|
|
*
|
|
* Constructor to make a new FPCUTPT on the cheap.
|
|
**********************************************************************/
|
|
|
|
void FPCUTPT::assign_cheap( //constructor
|
|
FPCUTPT *cutpts, //predecessors
|
|
inT16 array_origin, //start coord
|
|
inT16 x, //position
|
|
BOOL8 faking, //faking this one
|
|
BOOL8 mid_cut, //cheap cut.
|
|
inT16 offset, //dist to gap
|
|
STATS *projection, //vertical occupation
|
|
float projection_scale, //scaling
|
|
inT16 zero_count, //official zero
|
|
inT16 pitch, //proposed pitch
|
|
inT16 pitch_error //allowed tolerance
|
|
) {
|
|
int index; //test index
|
|
inT16 balance_count; //ding factor
|
|
inT16 r_index; //test cut number
|
|
FPCUTPT *segpt; //segment point
|
|
inT32 dist; //from prev segment
|
|
double sq_dist; //squared distance
|
|
double mean; //mean pitch
|
|
double total; //total dists
|
|
double factor; //cost function
|
|
//half of pitch
|
|
inT16 half_pitch = pitch / 2 - 1;
|
|
uinT32 lead_flag; //new flag
|
|
|
|
if (half_pitch > 31)
|
|
half_pitch = 31;
|
|
else if (half_pitch < 0)
|
|
half_pitch = 0;
|
|
lead_flag = 1 << half_pitch;
|
|
|
|
back_balance = cutpts[x - 1 - array_origin].back_balance << 1;
|
|
back_balance &= lead_flag + lead_flag - 1;
|
|
if (projection->pile_count (x) > zero_count)
|
|
back_balance |= 1;
|
|
fwd_balance = cutpts[x - 1 - array_origin].fwd_balance >> 1;
|
|
if (projection->pile_count (x + half_pitch) > zero_count)
|
|
fwd_balance |= lead_flag;
|
|
|
|
xpos = x;
|
|
cost = MAX_FLOAT32;
|
|
pred = NULL;
|
|
faked = faking;
|
|
terminal = FALSE;
|
|
region_index = 0;
|
|
fake_count = MAX_INT16;
|
|
index = x - pitch;
|
|
if (index >= array_origin) {
|
|
segpt = &cutpts[index - array_origin];
|
|
dist = x - segpt->xpos;
|
|
if (!segpt->terminal && segpt->fake_count < MAX_INT16) {
|
|
balance_count = 0;
|
|
if (textord_balance_factor > 0) {
|
|
lead_flag = back_balance ^ segpt->fwd_balance;
|
|
balance_count = 0;
|
|
while (lead_flag != 0) {
|
|
balance_count++;
|
|
lead_flag &= lead_flag - 1;
|
|
}
|
|
balance_count = (inT16) (balance_count * textord_balance_factor
|
|
/ projection_scale);
|
|
}
|
|
r_index = segpt->region_index + 1;
|
|
total = segpt->mean_sum + dist;
|
|
balance_count += offset;
|
|
sq_dist =
|
|
dist * dist + segpt->sq_sum + balance_count * balance_count;
|
|
mean = total / r_index;
|
|
factor = mean - pitch;
|
|
factor *= factor;
|
|
factor += sq_dist / (r_index) - mean * mean;
|
|
cost = factor; //find least cost
|
|
pred = segpt; //save path
|
|
mean_sum = total;
|
|
sq_sum = sq_dist;
|
|
fake_count = segpt->fake_count + faked;
|
|
mid_cuts = segpt->mid_cuts + mid_cut;
|
|
region_index = r_index;
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
/**********************************************************************
|
|
* check_pitch_sync
|
|
*
|
|
* Construct the lattice of possible segmentation points and choose the
|
|
* optimal path. Return the optimal path only.
|
|
* The return value is a measure of goodness of the sync.
|
|
**********************************************************************/
|
|
|
|
double check_pitch_sync2( //find segmentation
|
|
BLOBNBOX_IT *blob_it, //blobs to do
|
|
inT16 blob_count, //no of blobs
|
|
inT16 pitch, //pitch estimate
|
|
inT16 pitch_error, //tolerance
|
|
STATS *projection, //vertical
|
|
inT16 projection_left, //edges //scale factor
|
|
inT16 projection_right,
|
|
float projection_scale,
|
|
inT16 &occupation_count, //no of occupied cells
|
|
FPSEGPT_LIST *seg_list, //output list
|
|
inT16 start, //start of good range
|
|
inT16 end //end of good range
|
|
) {
|
|
BOOL8 faking; //illegal cut pt
|
|
BOOL8 mid_cut; //cheap cut pt.
|
|
inT16 x; //current coord
|
|
inT16 blob_index; //blob number
|
|
inT16 left_edge; //of word
|
|
inT16 right_edge; //of word
|
|
inT16 array_origin; //x coord of array
|
|
inT16 offset; //dist to legal area
|
|
inT16 zero_count; //projection zero
|
|
inT16 best_left_x = 0; //for equals
|
|
inT16 best_right_x = 0; //right edge
|
|
TBOX this_box; //bounding box
|
|
TBOX next_box; //box of next blob
|
|
FPSEGPT *segpt; //segment point
|
|
FPCUTPT *cutpts; //array of points
|
|
double best_cost; //best path
|
|
double mean_sum; //computes result
|
|
FPCUTPT *best_end; //end of best path
|
|
inT16 best_fake; //best fake level
|
|
inT16 best_count; //no of cuts
|
|
BLOBNBOX_IT this_it; //copy iterator
|
|
FPSEGPT_IT seg_it = seg_list; //output iterator
|
|
|
|
// tprintf("Computing sync on word of %d blobs with pitch %d\n",
|
|
// blob_count, pitch);
|
|
// if (blob_count==8 && pitch==27)
|
|
// projection->print(stdout,TRUE);
|
|
zero_count = 0;
|
|
if (pitch < 3)
|
|
pitch = 3; //nothing ludicrous
|
|
if ((pitch - 3) / 2 < pitch_error)
|
|
pitch_error = (pitch - 3) / 2;
|
|
this_it = *blob_it;
|
|
this_box = box_next (&this_it);//get box
|
|
// left_edge=this_box.left(); //left of word
|
|
// right_edge=this_box.right();
|
|
// for (blob_index=1;blob_index<blob_count;blob_index++)
|
|
// {
|
|
// this_box=box_next(&this_it);
|
|
// if (this_box.right()>right_edge)
|
|
// right_edge=this_box.right();
|
|
// }
|
|
for (left_edge = projection_left; projection->pile_count (left_edge) == 0
|
|
&& left_edge < projection_right; left_edge++);
|
|
for (right_edge = projection_right; projection->pile_count (right_edge) == 0
|
|
&& right_edge > left_edge; right_edge--);
|
|
ASSERT_HOST (right_edge >= left_edge);
|
|
if (pitsync_linear_version >= 4)
|
|
return check_pitch_sync3 (projection_left, projection_right, zero_count,
|
|
pitch, pitch_error, projection,
|
|
projection_scale, occupation_count, seg_list,
|
|
start, end);
|
|
array_origin = left_edge - pitch;
|
|
cutpts = (FPCUTPT *) alloc_mem ((right_edge - left_edge + pitch * 2 + 1)
|
|
* sizeof (FPCUTPT));
|
|
for (x = array_origin; x < left_edge; x++)
|
|
//free cuts
|
|
cutpts[x - array_origin].setup (cutpts, array_origin, projection, zero_count, pitch, x, 0);
|
|
for (offset = 0; offset <= pitch_error; offset++, x++)
|
|
//not quite free
|
|
cutpts[x - array_origin].setup (cutpts, array_origin, projection, zero_count, pitch, x, offset);
|
|
|
|
this_it = *blob_it;
|
|
best_cost = MAX_FLOAT32;
|
|
best_end = NULL;
|
|
this_box = box_next (&this_it);//first box
|
|
next_box = box_next (&this_it);//second box
|
|
blob_index = 1;
|
|
while (x < right_edge - pitch_error) {
|
|
if (x > this_box.right () + pitch_error && blob_index < blob_count) {
|
|
this_box = next_box;
|
|
next_box = box_next (&this_it);
|
|
blob_index++;
|
|
}
|
|
faking = FALSE;
|
|
mid_cut = FALSE;
|
|
if (x <= this_box.left ())
|
|
offset = 0;
|
|
else if (x <= this_box.left () + pitch_error)
|
|
offset = x - this_box.left ();
|
|
else if (x >= this_box.right ())
|
|
offset = 0;
|
|
else if (x >= next_box.left () && blob_index < blob_count) {
|
|
offset = x - next_box.left ();
|
|
if (this_box.right () - x < offset)
|
|
offset = this_box.right () - x;
|
|
}
|
|
else if (x >= this_box.right () - pitch_error)
|
|
offset = this_box.right () - x;
|
|
else if (x - this_box.left () > pitch * pitsync_joined_edge
|
|
&& this_box.right () - x > pitch * pitsync_joined_edge) {
|
|
mid_cut = TRUE;
|
|
offset = 0;
|
|
}
|
|
else {
|
|
faking = TRUE;
|
|
offset = projection->pile_count (x);
|
|
}
|
|
cutpts[x - array_origin].assign (cutpts, array_origin, x,
|
|
faking, mid_cut, offset, projection,
|
|
projection_scale, zero_count, pitch,
|
|
pitch_error);
|
|
x++;
|
|
}
|
|
|
|
best_fake = MAX_INT16;
|
|
best_cost = MAX_INT32;
|
|
best_count = MAX_INT16;
|
|
while (x < right_edge + pitch) {
|
|
offset = x < right_edge ? right_edge - x : 0;
|
|
cutpts[x - array_origin].assign (cutpts, array_origin, x,
|
|
FALSE, FALSE, offset, projection,
|
|
projection_scale, zero_count, pitch,
|
|
pitch_error);
|
|
cutpts[x - array_origin].terminal = TRUE;
|
|
if (cutpts[x - array_origin].index () +
|
|
cutpts[x - array_origin].fake_count <= best_count + best_fake) {
|
|
if (cutpts[x - array_origin].fake_count < best_fake
|
|
|| (cutpts[x - array_origin].fake_count == best_fake
|
|
&& cutpts[x - array_origin].cost_function () < best_cost)) {
|
|
best_fake = cutpts[x - array_origin].fake_count;
|
|
best_cost = cutpts[x - array_origin].cost_function ();
|
|
best_left_x = x;
|
|
best_right_x = x;
|
|
best_count = cutpts[x - array_origin].index ();
|
|
}
|
|
else if (cutpts[x - array_origin].fake_count == best_fake
|
|
&& x == best_right_x + 1
|
|
&& cutpts[x - array_origin].cost_function () == best_cost) {
|
|
//exactly equal
|
|
best_right_x = x;
|
|
}
|
|
}
|
|
x++;
|
|
}
|
|
ASSERT_HOST (best_fake < MAX_INT16);
|
|
|
|
best_end = &cutpts[(best_left_x + best_right_x) / 2 - array_origin];
|
|
if (this_box.right () == textord_test_x
|
|
&& this_box.top () == textord_test_y) {
|
|
for (x = left_edge - pitch; x < right_edge + pitch; x++) {
|
|
tprintf ("x=%d, C=%g, s=%g, sq=%g, prev=%d\n",
|
|
x, cutpts[x - array_origin].cost_function (),
|
|
cutpts[x - array_origin].sum (),
|
|
cutpts[x - array_origin].squares (),
|
|
cutpts[x - array_origin].previous ()->position ());
|
|
}
|
|
}
|
|
occupation_count = -1;
|
|
do {
|
|
for (x = best_end->position () - pitch + pitch_error;
|
|
x < best_end->position () - pitch_error
|
|
&& projection->pile_count (x) == 0; x++);
|
|
if (x < best_end->position () - pitch_error)
|
|
occupation_count++;
|
|
//copy it
|
|
segpt = new FPSEGPT (best_end);
|
|
seg_it.add_before_then_move (segpt);
|
|
best_end = best_end->previous ();
|
|
}
|
|
while (best_end != NULL);
|
|
seg_it.move_to_last ();
|
|
mean_sum = seg_it.data ()->sum ();
|
|
mean_sum = mean_sum * mean_sum / best_count;
|
|
if (seg_it.data ()->squares () - mean_sum < 0)
|
|
tprintf ("Impossible sqsum=%g, mean=%g, total=%d\n",
|
|
seg_it.data ()->squares (), seg_it.data ()->sum (), best_count);
|
|
free_mem(cutpts);
|
|
// tprintf("blob_count=%d, pitch=%d, sync=%g, occ=%d\n",
|
|
// blob_count,pitch,seg_it.data()->squares()-mean_sum,
|
|
// occupation_count);
|
|
return seg_it.data ()->squares () - mean_sum;
|
|
}
|
|
|
|
|
|
/**********************************************************************
|
|
* check_pitch_sync
|
|
*
|
|
* Construct the lattice of possible segmentation points and choose the
|
|
* optimal path. Return the optimal path only.
|
|
* The return value is a measure of goodness of the sync.
|
|
**********************************************************************/
|
|
|
|
double check_pitch_sync3( //find segmentation
|
|
inT16 projection_left, //edges //to be considered 0
|
|
inT16 projection_right,
|
|
inT16 zero_count,
|
|
inT16 pitch, //pitch estimate
|
|
inT16 pitch_error, //tolerance
|
|
STATS *projection, //vertical
|
|
float projection_scale, //scale factor
|
|
inT16 &occupation_count, //no of occupied cells
|
|
FPSEGPT_LIST *seg_list, //output list
|
|
inT16 start, //start of good range
|
|
inT16 end //end of good range
|
|
) {
|
|
BOOL8 faking; //illegal cut pt
|
|
BOOL8 mid_cut; //cheap cut pt.
|
|
inT16 left_edge; //of word
|
|
inT16 right_edge; //of word
|
|
inT16 x; //current coord
|
|
inT16 array_origin; //x coord of array
|
|
inT16 offset; //dist to legal area
|
|
inT16 projection_offset; //from scaled projection
|
|
inT16 prev_zero; //previous zero dist
|
|
inT16 next_zero; //next zero dist
|
|
inT16 zero_offset; //scan window
|
|
inT16 best_left_x = 0; //for equals
|
|
inT16 best_right_x = 0; //right edge
|
|
FPSEGPT *segpt; //segment point
|
|
FPCUTPT *cutpts; //array of points
|
|
BOOL8 *mins; //local min results
|
|
int minindex; //next input position
|
|
int test_index; //index to mins
|
|
double best_cost; //best path
|
|
double mean_sum; //computes result
|
|
FPCUTPT *best_end; //end of best path
|
|
inT16 best_fake; //best fake level
|
|
inT16 best_count; //no of cuts
|
|
FPSEGPT_IT seg_it = seg_list; //output iterator
|
|
|
|
end = (end - start) % pitch;
|
|
if (pitch < 3)
|
|
pitch = 3; //nothing ludicrous
|
|
if ((pitch - 3) / 2 < pitch_error)
|
|
pitch_error = (pitch - 3) / 2;
|
|
//min dist of zero
|
|
zero_offset = (inT16) (pitch * pitsync_joined_edge);
|
|
for (left_edge = projection_left; projection->pile_count (left_edge) == 0
|
|
&& left_edge < projection_right; left_edge++);
|
|
for (right_edge = projection_right; projection->pile_count (right_edge) == 0
|
|
&& right_edge > left_edge; right_edge--);
|
|
array_origin = left_edge - pitch;
|
|
cutpts = (FPCUTPT *) alloc_mem ((right_edge - left_edge + pitch * 2 + 1)
|
|
* sizeof (FPCUTPT));
|
|
mins = (BOOL8 *) alloc_mem ((pitch_error * 2 + 1) * sizeof (BOOL8));
|
|
for (x = array_origin; x < left_edge; x++)
|
|
//free cuts
|
|
cutpts[x - array_origin].setup (cutpts, array_origin, projection, zero_count, pitch, x, 0);
|
|
prev_zero = left_edge - 1;
|
|
for (offset = 0; offset <= pitch_error; offset++, x++)
|
|
//not quite free
|
|
cutpts[x - array_origin].setup (cutpts, array_origin, projection, zero_count, pitch, x, offset);
|
|
|
|
best_cost = MAX_FLOAT32;
|
|
best_end = NULL;
|
|
for (offset = -pitch_error, minindex = 0; offset < pitch_error;
|
|
offset++, minindex++)
|
|
mins[minindex] = projection->local_min (x + offset);
|
|
next_zero = x + zero_offset + 1;
|
|
for (offset = next_zero - 1; offset >= x; offset--) {
|
|
if (projection->pile_count (offset) <= zero_count) {
|
|
next_zero = offset;
|
|
break;
|
|
}
|
|
}
|
|
while (x < right_edge - pitch_error) {
|
|
mins[minindex] = projection->local_min (x + pitch_error);
|
|
minindex++;
|
|
if (minindex > pitch_error * 2)
|
|
minindex = 0;
|
|
faking = FALSE;
|
|
mid_cut = FALSE;
|
|
offset = 0;
|
|
if (projection->pile_count (x) <= zero_count) {
|
|
prev_zero = x;
|
|
}
|
|
else {
|
|
for (offset = 1; offset <= pitch_error; offset++)
|
|
if (projection->pile_count (x + offset) <= zero_count
|
|
|| projection->pile_count (x - offset) <= zero_count)
|
|
break;
|
|
}
|
|
if (offset > pitch_error) {
|
|
if (x - prev_zero > zero_offset && next_zero - x > zero_offset) {
|
|
for (offset = 0; offset <= pitch_error; offset++) {
|
|
test_index = minindex + pitch_error + offset;
|
|
if (test_index > pitch_error * 2)
|
|
test_index -= pitch_error * 2 + 1;
|
|
if (mins[test_index])
|
|
break;
|
|
test_index = minindex + pitch_error - offset;
|
|
if (test_index > pitch_error * 2)
|
|
test_index -= pitch_error * 2 + 1;
|
|
if (mins[test_index])
|
|
break;
|
|
}
|
|
}
|
|
if (offset > pitch_error) {
|
|
offset = projection->pile_count (x);
|
|
faking = TRUE;
|
|
}
|
|
else {
|
|
projection_offset =
|
|
(inT16) (projection->pile_count (x) / projection_scale);
|
|
if (projection_offset > offset)
|
|
offset = projection_offset;
|
|
mid_cut = TRUE;
|
|
}
|
|
}
|
|
if ((start == 0 && end == 0)
|
|
|| !textord_fast_pitch_test
|
|
|| (x - projection_left - start) % pitch <= end)
|
|
cutpts[x - array_origin].assign (cutpts, array_origin, x,
|
|
faking, mid_cut, offset, projection,
|
|
projection_scale, zero_count, pitch,
|
|
pitch_error);
|
|
else
|
|
cutpts[x - array_origin].assign_cheap (cutpts, array_origin, x,
|
|
faking, mid_cut, offset,
|
|
projection, projection_scale,
|
|
zero_count, pitch,
|
|
pitch_error);
|
|
x++;
|
|
if (next_zero < x || next_zero == x + zero_offset)
|
|
next_zero = x + zero_offset + 1;
|
|
if (projection->pile_count (x + zero_offset) <= zero_count)
|
|
next_zero = x + zero_offset;
|
|
}
|
|
|
|
best_fake = MAX_INT16;
|
|
best_cost = MAX_INT32;
|
|
best_count = MAX_INT16;
|
|
while (x < right_edge + pitch) {
|
|
offset = x < right_edge ? right_edge - x : 0;
|
|
cutpts[x - array_origin].assign (cutpts, array_origin, x,
|
|
FALSE, FALSE, offset, projection,
|
|
projection_scale, zero_count, pitch,
|
|
pitch_error);
|
|
cutpts[x - array_origin].terminal = TRUE;
|
|
if (cutpts[x - array_origin].index () +
|
|
cutpts[x - array_origin].fake_count <= best_count + best_fake) {
|
|
if (cutpts[x - array_origin].fake_count < best_fake
|
|
|| (cutpts[x - array_origin].fake_count == best_fake
|
|
&& cutpts[x - array_origin].cost_function () < best_cost)) {
|
|
best_fake = cutpts[x - array_origin].fake_count;
|
|
best_cost = cutpts[x - array_origin].cost_function ();
|
|
best_left_x = x;
|
|
best_right_x = x;
|
|
best_count = cutpts[x - array_origin].index ();
|
|
}
|
|
else if (cutpts[x - array_origin].fake_count == best_fake
|
|
&& x == best_right_x + 1
|
|
&& cutpts[x - array_origin].cost_function () == best_cost) {
|
|
//exactly equal
|
|
best_right_x = x;
|
|
}
|
|
}
|
|
x++;
|
|
}
|
|
ASSERT_HOST (best_fake < MAX_INT16);
|
|
|
|
best_end = &cutpts[(best_left_x + best_right_x) / 2 - array_origin];
|
|
// for (x=left_edge-pitch;x<right_edge+pitch;x++)
|
|
// {
|
|
// tprintf("x=%d, C=%g, s=%g, sq=%g, prev=%d\n",
|
|
// x,cutpts[x-array_origin].cost_function(),
|
|
// cutpts[x-array_origin].sum(),
|
|
// cutpts[x-array_origin].squares(),
|
|
// cutpts[x-array_origin].previous()->position());
|
|
// }
|
|
occupation_count = -1;
|
|
do {
|
|
for (x = best_end->position () - pitch + pitch_error;
|
|
x < best_end->position () - pitch_error
|
|
&& projection->pile_count (x) == 0; x++);
|
|
if (x < best_end->position () - pitch_error)
|
|
occupation_count++;
|
|
//copy it
|
|
segpt = new FPSEGPT (best_end);
|
|
seg_it.add_before_then_move (segpt);
|
|
best_end = best_end->previous ();
|
|
}
|
|
while (best_end != NULL);
|
|
seg_it.move_to_last ();
|
|
mean_sum = seg_it.data ()->sum ();
|
|
mean_sum = mean_sum * mean_sum / best_count;
|
|
if (seg_it.data ()->squares () - mean_sum < 0)
|
|
tprintf ("Impossible sqsum=%g, mean=%g, total=%d\n",
|
|
seg_it.data ()->squares (), seg_it.data ()->sum (), best_count);
|
|
free_mem(mins);
|
|
free_mem(cutpts);
|
|
return seg_it.data ()->squares () - mean_sum;
|
|
}
|