mirror of
https://github.com/tesseract-ocr/tesseract.git
synced 2025-01-18 22:43:45 +08:00
84920b92b3
Font recognition was poor, due to forcing a 1st and 2nd choice at a character level, when the total score for the correct font is often correct at the word level, so allowed the propagation of a full set of fonts and scores to the word recognizer, which can now decide word level fonts using the scores instead of simple votes. Change precipitated a cleanup of output data structures for classifier results, eliminating ScoredClass and INT_RESULT_STRUCT, with a few extra elements going in UnicharRating, and using that wherever possible. That added the extra complexity of 1-rating due to a flip between 0 is good and 0 is bad for the internal classifier scores before they are converted to rating and certainty.
190 lines
7.3 KiB
C++
190 lines
7.3 KiB
C++
///////////////////////////////////////////////////////////////////////
|
|
// File: fontinfo.h
|
|
// Description: Font information classes abstracted from intproto.h/cpp.
|
|
// Author: rays@google.com (Ray Smith)
|
|
// Created: Tue May 17 17:08:01 PDT 2011
|
|
//
|
|
// (C) Copyright 2011, Google Inc.
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
//
|
|
///////////////////////////////////////////////////////////////////////
|
|
|
|
|
|
#ifndef TESSERACT_CCSTRUCT_FONTINFO_H_
|
|
#define TESSERACT_CCSTRUCT_FONTINFO_H_
|
|
|
|
#include "genericvector.h"
|
|
#include "host.h"
|
|
#include "unichar.h"
|
|
|
|
template <typename T> class UnicityTable;
|
|
|
|
namespace tesseract {
|
|
|
|
class BitVector;
|
|
|
|
// Simple struct to hold a font and a score. The scores come from the low-level
|
|
// integer matcher, so they are in the uinT16 range. Fonts are an index to
|
|
// fontinfo_table.
|
|
// These get copied around a lot, so best to keep them small.
|
|
struct ScoredFont {
|
|
ScoredFont() : fontinfo_id(-1), score(0) {}
|
|
ScoredFont(int font_id, uinT16 classifier_score)
|
|
: fontinfo_id(font_id), score(classifier_score) {}
|
|
|
|
// Index into fontinfo table, but inside the classifier, may be a shapetable
|
|
// index.
|
|
inT32 fontinfo_id;
|
|
// Raw score from the low-level classifier.
|
|
uinT16 score;
|
|
};
|
|
|
|
// Struct for information about spacing between characters in a particular font.
|
|
struct FontSpacingInfo {
|
|
inT16 x_gap_before;
|
|
inT16 x_gap_after;
|
|
GenericVector<UNICHAR_ID> kerned_unichar_ids;
|
|
GenericVector<inT16> kerned_x_gaps;
|
|
};
|
|
|
|
/*
|
|
* font_properties contains properties about boldness, italicness, fixed pitch,
|
|
* serif, fraktur
|
|
*/
|
|
struct FontInfo {
|
|
FontInfo() : name(NULL), properties(0), universal_id(0), spacing_vec(NULL) {}
|
|
~FontInfo() {}
|
|
|
|
// Writes to the given file. Returns false in case of error.
|
|
bool Serialize(FILE* fp) const;
|
|
// Reads from the given file. Returns false in case of error.
|
|
// If swap is true, assumes a big/little-endian swap is needed.
|
|
bool DeSerialize(bool swap, FILE* fp);
|
|
|
|
// Reserves unicharset_size spots in spacing_vec.
|
|
void init_spacing(int unicharset_size) {
|
|
spacing_vec = new GenericVector<FontSpacingInfo *>();
|
|
spacing_vec->init_to_size(unicharset_size, NULL);
|
|
}
|
|
// Adds the given pointer to FontSpacingInfo to spacing_vec member
|
|
// (FontInfo class takes ownership of the pointer).
|
|
// Note: init_spacing should be called before calling this function.
|
|
void add_spacing(UNICHAR_ID uch_id, FontSpacingInfo *spacing_info) {
|
|
ASSERT_HOST(spacing_vec != NULL && spacing_vec->size() > uch_id);
|
|
(*spacing_vec)[uch_id] = spacing_info;
|
|
}
|
|
|
|
// Returns the pointer to FontSpacingInfo for the given UNICHAR_ID.
|
|
const FontSpacingInfo *get_spacing(UNICHAR_ID uch_id) const {
|
|
return (spacing_vec == NULL || spacing_vec->size() <= uch_id) ?
|
|
NULL : (*spacing_vec)[uch_id];
|
|
}
|
|
|
|
// Fills spacing with the value of the x gap expected between the two given
|
|
// UNICHAR_IDs. Returns true on success.
|
|
bool get_spacing(UNICHAR_ID prev_uch_id,
|
|
UNICHAR_ID uch_id,
|
|
int *spacing) const {
|
|
const FontSpacingInfo *prev_fsi = this->get_spacing(prev_uch_id);
|
|
const FontSpacingInfo *fsi = this->get_spacing(uch_id);
|
|
if (prev_fsi == NULL || fsi == NULL) return false;
|
|
int i = 0;
|
|
for (; i < prev_fsi->kerned_unichar_ids.size(); ++i) {
|
|
if (prev_fsi->kerned_unichar_ids[i] == uch_id) break;
|
|
}
|
|
if (i < prev_fsi->kerned_unichar_ids.size()) {
|
|
*spacing = prev_fsi->kerned_x_gaps[i];
|
|
} else {
|
|
*spacing = prev_fsi->x_gap_after + fsi->x_gap_before;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
bool is_italic() const { return properties & 1; }
|
|
bool is_bold() const { return (properties & 2) != 0; }
|
|
bool is_fixed_pitch() const { return (properties & 4) != 0; }
|
|
bool is_serif() const { return (properties & 8) != 0; }
|
|
bool is_fraktur() const { return (properties & 16) != 0; }
|
|
|
|
char* name;
|
|
uinT32 properties;
|
|
// The universal_id is a field reserved for the initialization process
|
|
// to assign a unique id number to all fonts loaded for the current
|
|
// combination of languages. This id will then be returned by
|
|
// ResultIterator::WordFontAttributes.
|
|
inT32 universal_id;
|
|
// Horizontal spacing between characters (indexed by UNICHAR_ID).
|
|
GenericVector<FontSpacingInfo *> *spacing_vec;
|
|
};
|
|
|
|
// Every class (character) owns a FontSet that represents all the fonts that can
|
|
// render this character.
|
|
// Since almost all the characters from the same script share the same set of
|
|
// fonts, the sets are shared over multiple classes (see
|
|
// Classify::fontset_table_). Thus, a class only store an id to a set.
|
|
// Because some fonts cannot render just one character of a set, there are a
|
|
// lot of FontSet that differ only by one font. Rather than storing directly
|
|
// the FontInfo in the FontSet structure, it's better to share FontInfos among
|
|
// FontSets (Classify::fontinfo_table_).
|
|
struct FontSet {
|
|
int size;
|
|
int* configs; // FontInfo ids
|
|
};
|
|
|
|
// Class that adds a bit of functionality on top of GenericVector to
|
|
// implement a table of FontInfo that replaces UniCityTable<FontInfo>.
|
|
// TODO(rays) change all references once all existing traineddata files
|
|
// are replaced.
|
|
class FontInfoTable : public GenericVector<FontInfo> {
|
|
public:
|
|
FontInfoTable();
|
|
~FontInfoTable();
|
|
|
|
// Writes to the given file. Returns false in case of error.
|
|
bool Serialize(FILE* fp) const;
|
|
// Reads from the given file. Returns false in case of error.
|
|
// If swap is true, assumes a big/little-endian swap is needed.
|
|
bool DeSerialize(bool swap, FILE* fp);
|
|
|
|
// Returns true if the given set of fonts includes one with the same
|
|
// properties as font_id.
|
|
bool SetContainsFontProperties(
|
|
int font_id, const GenericVector<ScoredFont>& font_set) const;
|
|
// Returns true if the given set of fonts includes multiple properties.
|
|
bool SetContainsMultipleFontProperties(
|
|
const GenericVector<ScoredFont>& font_set) const;
|
|
|
|
// Moves any non-empty FontSpacingInfo entries from other to this.
|
|
void MoveSpacingInfoFrom(FontInfoTable* other);
|
|
// Moves this to the target unicity table.
|
|
void MoveTo(UnicityTable<FontInfo>* target);
|
|
};
|
|
|
|
// Compare FontInfo structures.
|
|
bool CompareFontInfo(const FontInfo& fi1, const FontInfo& fi2);
|
|
// Compare FontSet structures.
|
|
bool CompareFontSet(const FontSet& fs1, const FontSet& fs2);
|
|
// Deletion callbacks for GenericVector.
|
|
void FontInfoDeleteCallback(FontInfo f);
|
|
void FontSetDeleteCallback(FontSet fs);
|
|
|
|
// Callbacks used by UnicityTable to read/write FontInfo/FontSet structures.
|
|
bool read_info(FILE* f, FontInfo* fi, bool swap);
|
|
bool write_info(FILE* f, const FontInfo& fi);
|
|
bool read_spacing_info(FILE *f, FontInfo* fi, bool swap);
|
|
bool write_spacing_info(FILE* f, const FontInfo& fi);
|
|
bool read_set(FILE* f, FontSet* fs, bool swap);
|
|
bool write_set(FILE* f, const FontSet& fs);
|
|
|
|
} // namespace tesseract.
|
|
|
|
#endif /* THIRD_PARTY_TESSERACT_CCSTRUCT_FONTINFO_H_ */
|