mirror of
https://github.com/tesseract-ocr/tesseract.git
synced 2025-01-11 05:27:49 +08:00
42144b9698
git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@870 d0cd1f9f-072b-0410-8dd7-cf729c803f20
165 lines
7.6 KiB
C++
165 lines
7.6 KiB
C++
///////////////////////////////////////////////////////////////////////
|
|
// File: detlinefit.h
|
|
// Description: Deterministic least upper-quartile squares line fitting.
|
|
// Author: Ray Smith
|
|
// Created: Thu Feb 28 14:35:01 PDT 2008
|
|
//
|
|
// (C) Copyright 2008, Google Inc.
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
//
|
|
///////////////////////////////////////////////////////////////////////
|
|
|
|
#ifndef TESSERACT_CCSTRUCT_DETLINEFIT_H_
|
|
#define TESSERACT_CCSTRUCT_DETLINEFIT_H_
|
|
|
|
#include "genericvector.h"
|
|
#include "kdpair.h"
|
|
#include "points.h"
|
|
|
|
namespace tesseract {
|
|
|
|
// This class fits a line to a set of ICOORD points.
|
|
// There is no restriction on the direction of the line, as it
|
|
// uses a vector method, ie no concern over infinite gradients.
|
|
// The fitted line has the least upper quartile of squares of perpendicular
|
|
// distances of all source points from the line, subject to the constraint
|
|
// that the line is made from one of the pairs of [{p1,p2,p3},{pn-2, pn-1, pn}]
|
|
// i.e. the 9 combinations of one of the first 3 and last 3 points.
|
|
// A fundamental assumption of this algorithm is that one of the first 3 and
|
|
// one of the last 3 points are near the best line fit.
|
|
// The points must be Added in line order for the algorithm to work properly.
|
|
// No floating point calculations are needed* to make an accurate fit,
|
|
// and no random numbers are needed** so the algorithm is deterministic,
|
|
// architecture-stable, and compiler-stable as well as stable to minor
|
|
// changes in the input.
|
|
// *A single floating point division is used to compute each line's distance.
|
|
// This is unlikely to result in choice of a different line, but if it does,
|
|
// it would be easy to replace with a 64 bit integer calculation.
|
|
// **Random numbers are used in the nth_item function, but the worst
|
|
// non-determinism that can result is picking a different result among equals,
|
|
// and that wouldn't make any difference to the end-result distance, so the
|
|
// randomness does not affect the determinism of the algorithm. The random
|
|
// numbers are only there to guarantee average linear time.
|
|
// Fitting time is linear, but with a high constant, as it tries 9 different
|
|
// lines and computes the distance of all points each time.
|
|
// This class is aimed at replacing the LLSQ (linear least squares) and
|
|
// LMS (least median of squares) classes that are currently used for most
|
|
// of the line fitting in Tesseract.
|
|
class DetLineFit {
|
|
public:
|
|
DetLineFit();
|
|
~DetLineFit();
|
|
|
|
// Delete all Added points.
|
|
void Clear();
|
|
|
|
// Adds a new point. Takes a copy - the pt doesn't need to stay in scope.
|
|
// Add must be called on points in sequence along the line.
|
|
void Add(const ICOORD& pt);
|
|
// Associates a half-width with the given point if a point overlaps the
|
|
// previous point by more than half the width, and its distance is further
|
|
// than the previous point, then the more distant point is ignored in the
|
|
// distance calculation. Useful for ignoring i dots and other diacritics.
|
|
void Add(const ICOORD& pt, int halfwidth);
|
|
|
|
// Fits a line to the points, returning the fitted line as a pair of
|
|
// points, and the upper quartile error.
|
|
double Fit(ICOORD* pt1, ICOORD* pt2) {
|
|
return Fit(0, 0, pt1, pt2);
|
|
}
|
|
// Fits a line to the points, ignoring the skip_first initial points and the
|
|
// skip_last final points, returning the fitted line as a pair of points,
|
|
// and the upper quartile error.
|
|
double Fit(int skip_first, int skip_last, ICOORD* pt1, ICOORD* pt2);
|
|
|
|
// Constrained fit with a supplied direction vector. Finds the best line_pt,
|
|
// that is one of the supplied points having the median cross product with
|
|
// direction, ignoring points that have a cross product outside of the range
|
|
// [min_dist, max_dist]. Returns the resulting error metric using the same
|
|
// reduced set of points.
|
|
// *Makes use of floating point arithmetic*
|
|
double ConstrainedFit(const FCOORD& direction,
|
|
double min_dist, double max_dist,
|
|
bool debug, ICOORD* line_pt);
|
|
|
|
// Returns true if there were enough points at the last call to Fit or
|
|
// ConstrainedFit for the fitted points to be used on a badly fitted line.
|
|
bool SufficientPointsForIndependentFit() const;
|
|
|
|
// Backwards compatible fit returning a gradient and constant.
|
|
// Deprecated. Prefer Fit(ICOORD*, ICOORD*) where possible, but use this
|
|
// function in preference to the LMS class.
|
|
double Fit(float* m, float* c);
|
|
|
|
// Backwards compatible constrained fit with a supplied gradient.
|
|
// Deprecated. Use ConstrainedFit(const FCOORD& direction) where possible
|
|
// to avoid potential difficulties with infinite gradients.
|
|
double ConstrainedFit(double m, float* c);
|
|
|
|
private:
|
|
// Simple struct to hold an ICOORD point and a halfwidth representing half
|
|
// the "width" (supposedly approximately parallel to the direction of the
|
|
// line) of each point, such that distant points can be discarded when they
|
|
// overlap nearer points. (Think i dot and other diacritics or noise.)
|
|
struct PointWidth {
|
|
PointWidth() : pt(ICOORD(0, 0)), halfwidth(0) {}
|
|
PointWidth(const ICOORD& pt0, int halfwidth0)
|
|
: pt(pt0), halfwidth(halfwidth0) {}
|
|
|
|
ICOORD pt;
|
|
int halfwidth;
|
|
};
|
|
// Type holds the distance of each point from the fitted line and the point
|
|
// itself. Use of double allows integer distances from ICOORDs to be stored
|
|
// exactly, and also the floating point results from ConstrainedFit.
|
|
typedef KDPairInc<double, ICOORD> DistPointPair;
|
|
|
|
// Computes and returns the squared evaluation metric for a line fit.
|
|
double EvaluateLineFit();
|
|
|
|
// Computes the absolute values of the precomputed distances_,
|
|
// and returns the squared upper-quartile error distance.
|
|
double ComputeUpperQuartileError();
|
|
|
|
// Returns the number of sample points that have an error more than threshold.
|
|
int NumberOfMisfittedPoints(double threshold) const;
|
|
|
|
// Computes all the cross product distances of the points from the line,
|
|
// storing the actual (signed) cross products in distances_.
|
|
// Ignores distances of points that are further away than the previous point,
|
|
// and overlaps the previous point by at least half.
|
|
void ComputeDistances(const ICOORD& start, const ICOORD& end);
|
|
|
|
// Computes all the cross product distances of the points perpendicular to
|
|
// the given direction, ignoring distances outside of the give distance range,
|
|
// storing the actual (signed) cross products in distances_.
|
|
void ComputeConstrainedDistances(const FCOORD& direction,
|
|
double min_dist, double max_dist);
|
|
|
|
// Stores all the source points in the order they were given and their
|
|
// halfwidths, if any.
|
|
GenericVector<PointWidth> pts_;
|
|
// Stores the computed perpendicular distances of (some of) the pts_ from a
|
|
// given vector (assuming it goes through the origin, making it a line).
|
|
// Since the distances may be a subset of the input points, and get
|
|
// re-ordered by the nth_item function, the original point is stored
|
|
// along side the distance.
|
|
GenericVector<DistPointPair> distances_; // Distances of points.
|
|
// The squared length of the vector used to compute distances_.
|
|
double square_length_;
|
|
};
|
|
|
|
} // namespace tesseract.
|
|
|
|
#endif // TESSERACT_CCSTRUCT_DETLINEFIT_H_
|
|
|
|
|