/////////////////////////////////////////////////////////////////////// // File: pdfrenderer.cpp // Description: PDF rendering interface to inject into TessBaseAPI // // (C) Copyright 2011, Google Inc. // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // http://www.apache.org/licenses/LICENSE-2.0 // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. // /////////////////////////////////////////////////////////////////////// // Include automatically generated configuration file if running autoconf. #ifdef HAVE_CONFIG_H #include "config_auto.h" #endif #include <memory> // std::unique_ptr #include "allheaders.h" #include "baseapi.h" #include "math.h" #include "renderer.h" #include "strngs.h" #include "tprintf.h" /* Design notes from Ken Sharp, with light editing. We think one solution is a font with a single glyph (.notdef) and a CIDToGIDMap which maps all the CIDs to 0. That map would then be stored as a stream in the PDF file, and when flate compressed should be pretty small. The font, of course, will be approximately the same size as the one you currently use. I'm working on such a font now. The CIDToGIDMap is trivial: you just create a stream object which contains 128k bytes (2 bytes per possible CID and your CIDs range from 0 to 65535) and where you currently have "/CIDToGIDMap /Identity" you would have "/CIDToGIDMap