mirror of
https://github.com/CCExtractor/ccextractor.git
synced 2024-12-25 20:32:10 +00:00
142 lines
7.0 KiB
C
142 lines
7.0 KiB
C
/*====================================================================*
|
|
- Copyright (C) 2001 Leptonica. All rights reserved.
|
|
-
|
|
- Redistribution and use in source and binary forms, with or without
|
|
- modification, are permitted provided that the following conditions
|
|
- are met:
|
|
- 1. Redistributions of source code must retain the above copyright
|
|
- notice, this list of conditions and the following disclaimer.
|
|
- 2. Redistributions in binary form must reproduce the above
|
|
- copyright notice, this list of conditions and the following
|
|
- disclaimer in the documentation and/or other materials
|
|
- provided with the distribution.
|
|
-
|
|
- THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
- ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
- LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
- A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL ANY
|
|
- CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
|
- EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
|
- PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
|
- PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
|
|
- OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
|
- NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
|
- SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*====================================================================*/
|
|
|
|
#ifndef LEPTONICA_JBCLASS_H
|
|
#define LEPTONICA_JBCLASS_H
|
|
|
|
/*!
|
|
* \file jbclass.h
|
|
*
|
|
* JbClasser
|
|
* JbData
|
|
*/
|
|
|
|
|
|
/*!
|
|
* <pre>
|
|
* The JbClasser struct holds all the data accumulated during the
|
|
* classification process that can be used for a compressed
|
|
* jbig2-type representation of a set of images. This is created
|
|
* in an initialization process and added to as the selected components
|
|
* on each successive page are analyzed.
|
|
* </pre>
|
|
*/
|
|
struct JbClasser
|
|
{
|
|
struct Sarray *safiles; /*!< input page image file names */
|
|
l_int32 method; /*!< JB_RANKHAUS, JB_CORRELATION */
|
|
l_int32 components; /*!< JB_CONN_COMPS, JB_CHARACTERS or */
|
|
/*!< JB_WORDS */
|
|
l_int32 maxwidth; /*!< max component width allowed */
|
|
l_int32 maxheight; /*!< max component height allowed */
|
|
l_int32 npages; /*!< number of pages already processed */
|
|
l_int32 baseindex; /*!< number components already processed */
|
|
/*!< on fully processed pages */
|
|
struct Numa *nacomps; /*!< number of components on each page */
|
|
l_int32 sizehaus; /*!< size of square struct elem for haus */
|
|
l_float32 rankhaus; /*!< rank val of haus match, each way */
|
|
l_float32 thresh; /*!< thresh value for correlation score */
|
|
l_float32 weightfactor; /*!< corrects thresh value for heaver */
|
|
/*!< components; use 0 for no correction */
|
|
struct Numa *naarea; /*!< w * h of each template, without */
|
|
/*!< extra border pixels */
|
|
l_int32 w; /*!< max width of original src images */
|
|
l_int32 h; /*!< max height of original src images */
|
|
l_int32 nclass; /*!< current number of classes */
|
|
l_int32 keep_pixaa; /*!< If zero, pixaa isn't filled */
|
|
struct Pixaa *pixaa; /*!< instances for each class; unbordered */
|
|
struct Pixa *pixat; /*!< templates for each class; bordered */
|
|
/*!< and not dilated */
|
|
struct Pixa *pixatd; /*!< templates for each class; bordered */
|
|
/*!< and dilated */
|
|
struct L_DnaHash *dahash; /*!< Hash table to find templates by size */
|
|
struct Numa *nafgt; /*!< fg areas of undilated templates; */
|
|
/*!< only used for rank < 1.0 */
|
|
struct Pta *ptac; /*!< centroids of all bordered cc */
|
|
struct Pta *ptact; /*!< centroids of all bordered template cc */
|
|
struct Numa *naclass; /*!< array of class ids for each component */
|
|
struct Numa *napage; /*!< array of page nums for each component */
|
|
struct Pta *ptaul; /*!< array of UL corners at which the */
|
|
/*!< template is to be placed for each */
|
|
/*!< component */
|
|
struct Pta *ptall; /*!< similar to ptaul, but for LL corners */
|
|
};
|
|
typedef struct JbClasser JBCLASSER;
|
|
|
|
|
|
/*!
|
|
* <pre>
|
|
* The JbData struct holds all the data required for
|
|
* the compressed jbig-type representation of a set of images.
|
|
* The data can be written to file, read back, and used
|
|
* to regenerate an approximate version of the original,
|
|
* which differs in two ways from the original:
|
|
* (1) It uses a template image for each c.c. instead of the
|
|
* original instance, for each occurrence on each page.
|
|
* (2) It discards components with either a height or width larger
|
|
* than the maximuma, given here by the lattice dimensions
|
|
* used for storing the templates.
|
|
* </pre>
|
|
*/
|
|
struct JbData
|
|
{
|
|
struct Pix *pix; /*!< template composite for all classes */
|
|
l_int32 npages; /*!< number of pages */
|
|
l_int32 w; /*!< max width of original page images */
|
|
l_int32 h; /*!< max height of original page images */
|
|
l_int32 nclass; /*!< number of classes */
|
|
l_int32 latticew; /*!< lattice width for template composite */
|
|
l_int32 latticeh; /*!< lattice height for template composite */
|
|
struct Numa *naclass; /*!< array of class ids for each component */
|
|
struct Numa *napage; /*!< array of page nums for each component */
|
|
struct Pta *ptaul; /*!< array of UL corners at which the */
|
|
/*!< template is to be placed for each */
|
|
/*!< component */
|
|
};
|
|
typedef struct JbData JBDATA;
|
|
|
|
|
|
/*! Classifier methods */
|
|
enum {
|
|
JB_RANKHAUS = 0,
|
|
JB_CORRELATION = 1
|
|
};
|
|
|
|
/*! For jbGetComponents(): type of component to extract from images */
|
|
enum {
|
|
JB_CONN_COMPS = 0,
|
|
JB_CHARACTERS = 1,
|
|
JB_WORDS = 2
|
|
};
|
|
|
|
/*! These parameters are used for naming the two files
|
|
* in which the jbig2-like compressed data is stored. */
|
|
#define JB_TEMPLATE_EXT ".templates.png"
|
|
#define JB_DATA_EXT ".data"
|
|
|
|
|
|
#endif /* LEPTONICA_JBCLASS_H */
|