tesseract/ccmain/thresholder.h

///////////////////////////////////////////////////////////////////////
// File:        thresholder.h
// Description: Base API for thresholding images in tesseract.
// Author:      Ray Smith
// Created:     Mon May 12 11:00:15 PDT 2008
//
// (C) Copyright 2008, Google Inc.
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
// http://www.apache.org/licenses/LICENSE-2.0
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
///////////////////////////////////////////////////////////////////////

#ifndef TESSERACT_CCMAIN_THRESHOLDER_H_
#define TESSERACT_CCMAIN_THRESHOLDER_H_

#include "platform.h"
#include "publictypes.h"

// Forward declaration of the Pix image type. This header only uses pointers
// to Pix (Pix*, Pix**), so the full definition is not needed here.
struct Pix;

namespace tesseract {

/// Base class for all tesseract image thresholding classes.
/// Specific classes can add new thresholding methods by
/// overriding ThresholdToPix.
/// Each instance deals with a single image, but the design is intended to
/// be useful for multiple calls to SetRectangle and ThresholdTo* if
/// desired.
class TESS_API ImageThresholder {
 public:
  /// Default constructor. Defined out of line.
  ImageThresholder();
  /// Virtual destructor, so that derived thresholders can be deleted through
  /// a pointer to this base class. Defined out of line.
  virtual ~ImageThresholder();

  /// Destroy the Pix if there is one, freeing memory.
  virtual void Clear();

  /// Return true if no image has been set.
  bool IsEmpty() const;

  /// SetImage makes a copy of all the image data, so it may be deleted
  /// immediately after this call.
  /// Greyscale of 8 and color of 24 or 32 bits per pixel may be given.
  /// Palette color images will not work properly and must be converted to
  /// 24 bit.
  /// Binary images of 1 bit per pixel may also be given but they must be
  /// byte packed with the MSB of the first byte being the first pixel, and a
  /// one pixel is WHITE. For binary images set bytes_per_pixel=0.
  void SetImage(const unsigned char* imagedata, int width, int height,
                int bytes_per_pixel, int bytes_per_line);

  /// Store the coordinates of the rectangle to process for later use.
  /// Doesn't actually do any thresholding.
  void SetRectangle(int left, int top, int width, int height);

  /// Get enough parameters to be able to rebuild bounding boxes in the
  /// original image (not just within the rectangle).
  /// Left and top are enough with top-down coordinates, but
  /// the height of the rectangle and the image are needed for bottom-up.
  virtual void GetImageSizes(int* left, int* top, int* width, int* height,
                             int* imagewidth, int* imageheight);

  /// Return true if the source image is color, i.e. it has at least three
  /// 8-bit channels.
  bool IsColor() const {
    return pix_channels_ >= 3;
  }

  /// Returns true if the source image is binary, i.e. it has zero 8-bit
  /// channels.
  bool IsBinary() const {
    return pix_channels_ == 0;
  }

  /// Return the scale factor from the original image.
  int GetScaleFactor() const {
    return scale_;
  }

  /// Set the resolution of the source image in pixels per inch.
  /// This should be called right after SetImage(), and will let us return
  /// appropriate font sizes for the text.
  /// Note that this also resets the estimated resolution to the same value,
  /// so call SetEstimatedResolution() afterwards if a different estimate is
  /// wanted.
  void SetSourceYResolution(int ppi) {
    yres_ = ppi;
    estimated_res_ = ppi;
  }
  /// Return the y resolution of the source image in pixels per inch, without
  /// any scaling applied.
  int GetSourceYResolution() const {
    return yres_;
  }
  /// Return the y resolution of the source image multiplied by the scale
  /// factor.
  int GetScaledYResolution() const {
    return scale_ * yres_;
  }
  /// Set the resolution of the source image in pixels per inch, as estimated
  /// by the thresholder from the text size found during thresholding.
  /// This value will be used to set internal size thresholds during recognition
  /// and will not influence the output "point size." The default value is
  /// the same as the source resolution. (yres_)
  void SetEstimatedResolution(int ppi) {
    estimated_res_ = ppi;
  }
  /// Returns the estimated resolution, including any active scaling.
  /// This value will be used to set internal size thresholds during recognition.
  int GetScaledEstimatedResolution() const {
    return scale_ * estimated_res_;
  }

  /// Pix vs raw, which to use? Pix is the preferred input for efficiency,
  /// since raw buffers are copied.
  /// SetImage for Pix clones its input, so the source pix may be pixDestroyed
  /// immediately after, but may not go away until after the Thresholder has
  /// finished with it.
  void SetImage(const Pix* pix);

  /// Threshold the source image as efficiently as possible to the output Pix.
  /// Creates a Pix and sets pix to point to the resulting pointer.
  /// Caller must use pixDestroy to free the created Pix.
  /// NOTE(review): how pageseg_mode influences the result is not visible in
  /// this header; check the implementation.
  virtual void ThresholdToPix(PageSegMode pageseg_mode, Pix** pix);

  /// Gets a pix that contains an 8 bit threshold value at each pixel. The
  /// returned pix may be an integer reduction of the binary image such that
  /// the scale factor may be inferred from the ratio of the sizes, even down
  /// to the extreme of a 1x1 pixel thresholds image.
  /// Ideally the 8 bit threshold should be the exact threshold used to generate
  /// the binary image in ThresholdToPix, but this is not a hard constraint.
  /// Returns NULL if the input is binary. The returned Pix must be
  /// pixDestroyed after use.
  virtual Pix* GetPixRectThresholds();

  /// Get a clone/copy of the source image rectangle.
  /// The returned Pix must be pixDestroyed.
  /// This function will be used in the future by the page layout analysis, and
  /// the layout analysis that uses it will only be available with Leptonica,
  /// so there is no raw equivalent.
  Pix* GetPixRect();

  /// Get a clone/copy of the source image rectangle, reduced to greyscale,
  /// and at the same resolution as the output binary.
  /// The returned Pix must be pixDestroyed.
  /// Provided to the classifier to extract features from the greyscale image.
  virtual Pix* GetPixRectGrey();

 protected:
  // ----------------------------------------------------------------------
  // Utility functions that may be useful components for other thresholders.

  /// Common initialization shared between SetImage methods.
  virtual void Init();

  /// Return true if we are processing the full image, i.e. the rectangle to
  /// process starts at (0, 0) and has the same width and height as the image.
  bool IsFullImage() const {
    return rect_left_ == 0 && rect_top_ == 0 &&
           rect_width_ == image_width_ && rect_height_ == image_height_;
  }

  /// Otsu thresholds the rectangle, taking the rectangle from *this.
  void OtsuThresholdRectToPix(Pix* src_pix, Pix** out_pix) const;

  /// Threshold the rectangle, taking everything except the src_pix
  /// from the class, using thresholds/hi_values to the output pix.
  /// NOTE that num_channels is the size of the thresholds and hi_values
  /// arrays and also the bytes per pixel in src_pix.
  void ThresholdRectToPix(Pix* src_pix, int num_channels,
                          const int* thresholds, const int* hi_values,
                          Pix** pix) const;

  // ----------------------------------------------------------------------
  // Data members, accessible to derived thresholders.
 protected:
  /// Clone or other copy of the source Pix.
  /// The pix will always be PixDestroy()ed on destruction of the class.
  Pix*                 pix_;

  int                  image_width_;    ///< Width of source pix_.
  int                  image_height_;   ///< Height of source pix_.
  int                  pix_channels_;   ///< Number of 8-bit channels in pix_.
  int                  pix_wpl_;        ///< Words per line of pix_.
  int                  scale_;          ///< Scale factor from original image.
  int                  yres_;           ///< y pixels/inch in source image.
  int                  estimated_res_;  ///< Resolution estimate from text size.
  // Limits of image rectangle to be processed.
  int                  rect_left_;      ///< Left edge of the rectangle.
  int                  rect_top_;       ///< Top edge of the rectangle.
  int                  rect_width_;     ///< Width of the rectangle.
  int                  rect_height_;    ///< Height of the rectangle.
};

}  // namespace tesseract.

#endif  // TESSERACT_CCMAIN_THRESHOLDER_H_
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`///////////////////////////////////////////////////////////////////////`
			`// File: thresholder.h`
			`// Description: Base API for thresholding images in tesseract.`
			`// Author: Ray Smith`
			`// Created: Mon May 12 11:00:15 PDT 2008`
			`//`
			`// (C) Copyright 2008, Google Inc.`
			`// Licensed under the Apache License, Version 2.0 (the "License");`
			`// you may not use this file except in compliance with the License.`
			`// You may obtain a copy of the License at`
			`// http://www.apache.org/licenses/LICENSE-2.0`
			`// Unless required by applicable law or agreed to in writing, software`
			`// distributed under the License is distributed on an "AS IS" BASIS,`
			`// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`// See the License for the specific language governing permissions and`
			`// limitations under the License.`
			`//`
			`///////////////////////////////////////////////////////////////////////`

Replace reserved identifiers used in #define guards header files Use macro names as suggested by the Google C++ Style Guide (https://google.github.io/styleguide/cppguide.html#The__define_Guard). Signed-off-by: Stefan Weil <sw@weilnetz.de> 2016-12-04 21:45:26 +08:00			`#ifndef TESSERACT_CCMAIN_THRESHOLDER_H_`
			`#define TESSERACT_CCMAIN_THRESHOLDER_H_`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00
Major refactor of control.cpp to enable line recognition git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@1147 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2014-08-12 07:23:06 +08:00			`#include "platform.h"`
			`#include "publictypes.h"`
fix issue 967 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@886 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2013-09-30 04:48:06 +08:00
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`struct Pix;`

			`namespace tesseract {`

partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Base class for all tesseract image thresholding classes.`
			`/// Specific classes can add new thresholding methods by`
Added sub/superscript, small/dropcap detection git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@547 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-12-09 09:32:20 +08:00			`/// overriding ThresholdToPix.`
partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Each instance deals with a single image, but the design is intended to`
			`/// be useful for multiple calls to SetRectangle and ThresholdTo* if`
			`/// desired.`
fix issue 967 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@886 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2013-09-30 04:48:06 +08:00			`class TESS_API ImageThresholder {`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`public:`
			`ImageThresholder();`
			`virtual ~ImageThresholder();`

partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Destroy the Pix if there is one, freeing memory.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`virtual void Clear();`

partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Return true if no image has been set.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`bool IsEmpty() const;`

Removed dependence on IMAGE class git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@955 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2014-01-10 01:45:57 +08:00			`/// SetImage makes a copy of all the image data, so it may be deleted`
			`/// immediately after this call.`
partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Greyscale of 8 and color of 24 or 32 bits per pixel may be given.`
			`/// Palette color images will not work properly and must be converted to`
			`/// 24 bit.`
			`/// Binary images of 1 bit per pixel may also be given but they must be`
			`/// byte packed with the MSB of the first byte being the first pixel, and a`
			`/// one pixel is WHITE. For binary images set bytes_per_pixel=0.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`void SetImage(const unsigned char* imagedata, int width, int height,`
			`int bytes_per_pixel, int bytes_per_line);`

partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Store the coordinates of the rectangle to process for later use.`
			`/// Doesn't actually do any thresholding.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`void SetRectangle(int left, int top, int width, int height);`

partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Get enough parameters to be able to rebuild bounding boxes in the`
			`/// original image (not just within the rectangle).`
			`/// Left and top are enough with top-down coordinates, but`
			`/// the height of the rectangle and the image are needed for bottom-up.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`virtual void GetImageSizes(int* left, int* top, int* width, int* height,`
			`int* imagewidth, int* imageheight);`

partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Return true if the source image is color.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`bool IsColor() const {`
Removed dependence on IMAGE class git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@955 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2014-01-10 01:45:57 +08:00			`return pix_channels_ >= 3;`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`}`

3.01 code from http://github.com/jimregan/tesseract-ocr with addaptions related to Linux and Windows (VC2008) compile process git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@526 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-11-24 02:34:14 +08:00			`/// Returns true if the source image is binary.`
			`bool IsBinary() const {`
Removed dependence on IMAGE class git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@955 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2014-01-10 01:45:57 +08:00			`return pix_channels_ == 0;`
3.01 code from http://github.com/jimregan/tesseract-ocr with addaptions related to Linux and Windows (VC2008) compile process git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@526 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-11-24 02:34:14 +08:00			`}`

Added sub/superscript, small/dropcap detection git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@547 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-12-09 09:32:20 +08:00			`int GetScaleFactor() const {`
			`return scale_;`
			`}`
Added Right-to-left/Bidi capability in the output iterators for Hebrew/Arabic, Added paragraph detection in layout analysis/post OCR, Fixed inconsistent xheight during training and over-chopping, Added simultaneous multi-language capability, Refactored top-level word recognition module, Fixed problems with internally scaled images git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@651 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2012-02-02 10:59:49 +08:00
			`// Set the resolution of the source image in pixels per inch.`
			`// This should be called right after SetImage(), and will let us return`
			`// appropriate font sizes for the text.`
			`void SetSourceYResolution(int ppi) {`
			`yres_ = ppi;`
			`estimated_res_ = ppi;`
			`}`
Added sub/superscript, small/dropcap detection git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@547 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-12-09 09:32:20 +08:00			`int GetSourceYResolution() const {`
			`return yres_;`
			`}`
			`int GetScaledYResolution() const {`
			`return scale_ * yres_;`
			`}`
Added Right-to-left/Bidi capability in the output iterators for Hebrew/Arabic, Added paragraph detection in layout analysis/post OCR, Fixed inconsistent xheight during training and over-chopping, Added simultaneous multi-language capability, Refactored top-level word recognition module, Fixed problems with internally scaled images git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@651 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2012-02-02 10:59:49 +08:00			`// Set the resolution of the source image in pixels per inch, as estimated`
			`// by the thresholder from the text size found during thresholding.`
			`// This value will be used to set internal size thresholds during recognition`
			`// and will not influence the output "point size." The default value is`
			`// the same as the source resolution. (yres_)`
			`void SetEstimatedResolution(int ppi) {`
			`estimated_res_ = ppi;`
			`}`
			`// Returns the estimated resolution, including any active scaling.`
			`// This value will be used to set internal size thresholds during recognition.`
			`int GetScaledEstimatedResolution() const {`
			`return scale_ * estimated_res_;`
			`}`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00
Removed dependence on IMAGE class git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@955 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2014-01-10 01:45:57 +08:00			`/// Pix vs raw, which to use? Pix is the preferred input for efficiency,`
			`/// since raw buffers are copied.`
			`/// SetImage for Pix clones its input, so the source pix may be pixDestroyed`
			`/// immediately after, but may not go away until after the Thresholder has`
			`/// finished with it.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`void SetImage(const Pix* pix);`

partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Threshold the source image as efficiently as possible to the output Pix.`
			`/// Creates a Pix and sets pix to point to the resulting pointer.`
			`/// Caller must use pixDestroy to free the created Pix.`
Major refactor of control.cpp to enable line recognition git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@1147 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2014-08-12 07:23:06 +08:00			`virtual void ThresholdToPix(PageSegMode pageseg_mode, Pix** pix);`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00
Generalized feature extractor to allow fx from greyscale git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@875 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2013-09-23 23:19:50 +08:00			`// Gets a pix that contains an 8 bit threshold value at each pixel. The`
			`// returned pix may be an integer reduction of the binary image such that`
			`// the scale factor may be inferred from the ratio of the sizes, even down`
			`// to the extreme of a 1x1 pixel thresholds image.`
			`// Ideally the 8 bit threshold should be the exact threshold used to generate`
			`// the binary image in ThresholdToPix, but this is not a hard constraint.`
			`// Returns NULL if the input is binary. PixDestroy after use.`
			`virtual Pix* GetPixRectThresholds();`

partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Get a clone/copy of the source image rectangle.`
			`/// The returned Pix must be pixDestroyed.`
			`/// This function will be used in the future by the page layout analysis, and`
			`/// the layout analysis that uses it will only be available with Leptonica,`
			`/// so there is no raw equivalent.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`Pix* GetPixRect();`
3.01 code from http://github.com/jimregan/tesseract-ocr with addaptions related to Linux and Windows (VC2008) compile process git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@526 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-11-24 02:34:14 +08:00
Generalized feature extractor to allow fx from greyscale git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@875 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2013-09-23 23:19:50 +08:00			`// Get a clone/copy of the source image rectangle, reduced to greyscale,`
			`// and at the same resolution as the output binary.`
			`// The returned Pix must be pixDestroyed.`
			`// Provided to the classifier to extract features from the greyscale image.`
			`virtual Pix* GetPixRectGrey();`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00
			`protected:`
			`// ----------------------------------------------------------------------`
			`// Utility functions that may be useful components for other thresholders.`

partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Common initialization shared between SetImage methods.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`virtual void Init();`

partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Return true if we are processing the full image.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`bool IsFullImage() const {`
			`return rect_left_ == 0 && rect_top_ == 0 &&`
			`rect_width_ == image_width_ && rect_height_ == image_height_;`
			`}`

Removed dependence on IMAGE class git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@955 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2014-01-10 01:45:57 +08:00			`// Otsu thresholds the rectangle, taking the rectangle from *this.`
			`void OtsuThresholdRectToPix(Pix* src_pix, Pix** out_pix) const;`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00
Removed dependence on IMAGE class git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@955 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2014-01-10 01:45:57 +08:00			`/// Threshold the rectangle, taking everything except the src_pix`
			`/// from the class, using thresholds/hi_values to the output pix.`
			`/// NOTE that num_channels is the size of the thresholds and hi_values`
			`// arrays and also the bytes per pixel in src_pix.`
			`void ThresholdRectToPix(Pix* src_pix, int num_channels,`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`const int* thresholds, const int* hi_values,`
			`Pix** pix) const;`

			`protected:`
partial merge of doxygen branch (stuff without conflicts, basically) git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@441 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-07-27 21:23:23 +08:00			`/// Clone or other copy of the source Pix.`
			`/// The pix will always be PixDestroy()ed on destruction of the class.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`Pix* pix_;`

Removed dependence on IMAGE class git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@955 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2014-01-10 01:45:57 +08:00			`int image_width_; //< Width of source pix_.`
			`int image_height_; //< Height of source pix_.`
			`int pix_channels_; //< Number of 8-bit channels in pix_.`
			`int pix_wpl_; //< Words per line of pix_.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`// Limits of image rectangle to be processed.`
Added sub/superscript, small/dropcap detection git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@547 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2010-12-09 09:32:20 +08:00			`int scale_; //< Scale factor from original image.`
Added Right-to-left/Bidi capability in the output iterators for Hebrew/Arabic, Added paragraph detection in layout analysis/post OCR, Fixed inconsistent xheight during training and over-chopping, Added simultaneous multi-language capability, Refactored top-level word recognition module, Fixed problems with internally scaled images git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@651 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2012-02-02 10:59:49 +08:00			`int yres_; //< y pixels/inch in source image.`
			`int estimated_res_; //< Resolution estimate from text size.`
More changes to ccmain for 3.00 git-svn-id: https://tesseract-ocr.googlecode.com/svn/trunk@287 d0cd1f9f-072b-0410-8dd7-cf729c803f20 2009-07-11 10:07:25 +08:00			`int rect_left_;`
			`int rect_top_;`
			`int rect_width_;`
			`int rect_height_;`
			`};`

			`} // namespace tesseract.`

Replace reserved identifiers used in #define guards header files Use macro names as suggested by the Google C++ Style Guide (https://google.github.io/styleguide/cppguide.html#The__define_Guard). Signed-off-by: Stefan Weil <sw@weilnetz.de> 2016-12-04 21:45:26 +08:00			`#endif // TESSERACT_CCMAIN_THRESHOLDER_H_`