2010-09-30 10:06:29 +08:00
|
|
|
<?xml version="1.0" encoding="UTF-8"?>
|
|
|
|
<!DOCTYPE refentry PUBLIC "-//OASIS//DTD DocBook XML V4.5//EN" "http://www.oasis-open.org/docbook/xml/4.5/docbookx.dtd">
|
|
|
|
<?asciidoc-toc?>
|
|
|
|
<?asciidoc-numbered?>
|
|
|
|
<refentry lang="en">
|
|
|
|
<refmeta>
|
|
|
|
<refentrytitle>cntraining</refentrytitle>
|
|
|
|
<manvolnum>1</manvolnum>
|
|
|
|
<refmiscinfo class="source"> </refmiscinfo>
|
|
|
|
<refmiscinfo class="manual"> </refmiscinfo>
|
|
|
|
</refmeta>
|
|
|
|
<refnamediv>
|
|
|
|
<refname>cntraining</refname>
|
|
|
|
<refpurpose>character normalization training for Tesseract</refpurpose>
|
|
|
|
</refnamediv>
|
|
|
|
<refsynopsisdiv id="_synopsis">
|
2012-02-10 06:55:47 +08:00
|
|
|
<simpara><emphasis role="strong">cntraining</emphasis> [-D <emphasis>dir</emphasis>] <emphasis>FILE</emphasis>…</simpara>
|
2010-09-30 10:06:29 +08:00
|
|
|
</refsynopsisdiv>
|
|
|
|
<refsect1 id="_description">
|
|
|
|
<title>DESCRIPTION</title>
|
|
|
|
<simpara>cntraining takes a list of .tr files, from which it generates the
|
2012-02-10 06:55:47 +08:00
|
|
|
<emphasis role="strong">normproto</emphasis> data file (the character normalization sensitivity
|
|
|
|
prototypes).</simpara>
|
|
|
|
</refsect1>
|
|
|
|
<refsect1 id="_options">
|
|
|
|
<title>OPTIONS</title>
|
|
|
|
<variablelist>
|
|
|
|
<varlistentry>
|
|
|
|
<term>
|
|
|
|
-D <emphasis>dir</emphasis>
|
|
|
|
</term>
|
|
|
|
<listitem>
|
|
|
|
<simpara>
|
|
|
|
Directory to write output files to.
|
|
|
|
</simpara>
|
|
|
|
</listitem>
|
|
|
|
</varlistentry>
|
|
|
|
</variablelist>
|
2010-09-30 10:06:29 +08:00
|
|
|
</refsect1>
|
|
|
|
<refsect1 id="_see_also">
|
|
|
|
<title>SEE ALSO</title>
|
2012-02-10 06:55:47 +08:00
|
|
|
<simpara>tesseract(1), shapeclustering(1), mftraining(1)</simpara>
|
2010-09-30 10:06:29 +08:00
|
|
|
<simpara><ulink url="http://code.google.com/p/tesseract-ocr/wiki/TrainingTesseract3">http://code.google.com/p/tesseract-ocr/wiki/TrainingTesseract3</ulink></simpara>
|
|
|
|
</refsect1>
|
|
|
|
<refsect1 id="_copying">
|
|
|
|
<title>COPYING</title>
|
|
|
|
<simpara>Copyright (c) Hewlett-Packard Company, 1988.
|
|
|
|
Licensed under the Apache License, Version 2.0</simpara>
|
|
|
|
</refsect1>
|
2012-02-10 06:55:47 +08:00
|
|
|
<refsect1 id="_author">
|
|
|
|
<title>AUTHOR</title>
|
|
|
|
<simpara>The Tesseract OCR engine was written by Ray Smith and his research groups
|
|
|
|
at Hewlett-Packard (1985-1995) and Google (2006-present).</simpara>
|
|
|
|
</refsect1>
|
2010-09-30 10:06:29 +08:00
|
|
|
</refentry>
|