summaryrefslogtreecommitdiffstats
path: root/kooka/ocrword.h
blob: 606acb9f9a1aa21f181dbb0ab1250268501b2ea1 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
/***************************************************************************
                      ocrword.h  - ocr-result word and wordlist
                             -------------------
    begin                : Fri 10 Jan 2003
    copyright            : (C) 2003 by Klaas Freitag
    email                : freitag@suse.de
 ***************************************************************************/

/***************************************************************************
 *                                                                         *
 *  This file may be distributed and/or modified under the terms of the    *
 *  GNU General Public License version 2 as published by the Free Software *
 *  Foundation and appearing in the file COPYING included in the           *
 *  packaging of this file.                                                *
 *
 *  As a special exception, permission is given to link this program       *
 *  with any version of the KADMOS ocr/icr engine of reRecognition GmbH,   *
 *  Kreuzlingen and distribute the resulting executable without            *
 *  including the source code for KADMOS in the source distribution.       *
 *
 *  As a special exception, permission is given to link this program       *
 *  with any edition of Qt, and distribute the resulting executable,       *
 *  without including the source code for Qt in the source distribution.   *
 *                                                                         *
 ***************************************************************************/

#ifndef _OCR_WORD_
#define _OCR_WORD_

#include <qstringlist.h>
#include <qvaluevector.h>
#include <qvaluelist.h>
#include <qrect.h>

class QString;
class QRect;


/* ==== ocrWord ====================================== */
class ocrWord : public QString
{
public:
    ocrWord(const QString& s);
    ocrWord();
    QStringList getAlternatives()
        { return m_alternatives; }

    void setAlternatives( const QString& s )
        { m_alternatives.append(s); }

    // QRect boundingRect();

    void setKnode( int k )
        { m_startKnode = k; }
    void setLine( int l )
        { m_line = l; }

    int getLine() const { return m_line; }
    int getKnode() const { return m_startKnode; }

    void setRect( const QRect& r )
        { m_position = r; }
    QRect rect()
        { return m_position; }

private:
    QStringList m_alternatives;
    int         m_startKnode;
    int         m_line;
    QRect       m_position;
};

/* ==== ocrWordList ====================================== */

/**
 * This represents a line of words in an ocr'ed document
 */
class ocrWordList : public QValueList<ocrWord>
{
public:
    ocrWordList();
    QStringList stringList();

    bool updateOCRWord( const QString& from, const QString& to );

    bool findFuzzyIndex( const QString& word, ocrWord& resWord );

    QRect wordListRect( );

    void setBlock( int b );
    int block() const { return m_block; }

private:
    int m_block;
};

/**
 * All lines of a block: A value vector containing as much as entries
 * as lines are available in a block. Needs to be resized acordingly.
 */
typedef QValueVector<ocrWordList> ocrBlock;

/**
 * Blocks taken together form the page.
 * Attention: Needs to be resized to the amount of blocks !!
 */
typedef QValueVector<ocrBlock> ocrBlockPage;

typedef QValueVector<QRect> rectList;

#endif