1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
|
/**********************************************************************
** Copyright (C) 2000-2003 Trolltech AS. All rights reserved.
**
** This file is part of the TQt Assistant.
**
** This file may be distributed and/or modified under the terms of the
** GNU General Public License version 2 as published by the Free Software
** Foundation and appearing in the file LICENSE.GPL included in the
** packaging of this file.
**
** Licensees holding valid TQt Enterprise Edition or TQt Professional Edition
** licenses may use this file in accordance with the TQt Commercial License
** Agreement provided with the Software.
**
** This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
** WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
**
** See http://www.trolltech.com/gpl/ for GPL licensing information.
** See http://www.trolltech.com/pricing.html or email sales@trolltech.com for
** information about TQt Commercial License Agreements.
**
** Contact info@trolltech.com if any conditions of this licensing are
** not clear to you.
**
**********************************************************************/
#ifndef INDEX_H
#define INDEX_H
#include <tqstringlist.h>
#include "kvi_pointerhashtable.h"
#include "kvi_pointerlist.h"
#include "kvi_valuelist.h"
#include <tqdatastream.h>
#include <tqobject.h>
/**
 * A (document number, frequency) pair.
 *
 * Equality compares the document number only. The relational operators
 * compare the frequency only and are reversed on purpose: a Document with
 * a HIGHER frequency is "less than" one with a lower frequency, so any
 * ordering built on operator< places higher frequencies first.
 */
struct Document
{
    /** Default state: docNumber is -1 and frequency is 0. */
    Document()
        : docNumber( -1 ),
          frequency( 0 )
    {
    }

    /** Stores both values after converting them to TQ_INT16. */
    Document( int number, int count )
        : docNumber( static_cast<TQ_INT16>( number ) ),
          frequency( static_cast<TQ_INT16>( count ) )
    {
    }

    /** True when both objects carry the same docNumber; frequency is ignored. */
    bool operator==( const Document &other ) const
    {
        return other.docNumber == docNumber;
    }

    /** True when this frequency is strictly greater than the other one. */
    bool operator<( const Document &other ) const
    {
        return other.frequency < frequency;
    }

    /** True when this frequency is greater than or equal to the other one. */
    bool operator<=( const Document &other ) const
    {
        return !( frequency < other.frequency );
    }

    /** True when this frequency is strictly smaller than the other one. */
    bool operator>( const Document &other ) const
    {
        return other.frequency > frequency;
    }

    TQ_INT16 docNumber;
    TQ_INT16 frequency;
};
/**
 * Stream extraction for Document. Only declared here; the definition lives
 * outside this header. Returns a TQDataStream reference (presumably the
 * stream passed in, per the usual chaining convention -- confirm in the
 * implementation).
 */
TQDataStream &operator>>( TQDataStream &stream, Document &doc );

/**
 * Stream insertion for Document. Only declared here; the definition lives
 * outside this header. The Document is taken by const reference.
 */
TQDataStream &operator<<( TQDataStream &stream, const Document &doc );
/**
 * Index over a list of documents (docList) backed by a term dictionary
 * (dict) that maps a TQString key to an Entry.
 *
 * Only the declaration is visible in this header: every member function
 * without an inline body is defined in the implementation file, so the
 * notes below describe signatures, not behaviour.
 */
class Index : public TQObject
{
    TQ_OBJECT
public:
    /** Dictionary value: the list of Document records kept for one key. */
    struct Entry {
        /** Starts the list with the single record Document( d, 1 ). */
        Entry( int d ) { documents.append( Document( d, 1 ) ); }
        /** Copies an existing list; taken by const reference so the
         *  argument is copied once (into the member) instead of twice. */
        Entry( const KviValueList<Document> &l ) : documents( l ) {}
        KviValueList<Document> documents;
    };

    /** Mini-dictionary value: a list of unsigned positions. */
    struct PosEntry {
        /** Starts the list with the single position p. */
        PosEntry( int p ) { positions.append( p ); }
        KviValueList<uint> positions;
    };

    // Two construction paths: from a single string (dp) or from a string
    // list (dl); hp is a second string in both cases.
    // NOTE(review): presumably dp = document path, dl = document list and
    // hp = a home/help path -- confirm against the implementation.
    Index( const TQString &dp, const TQString &hp );
    Index( const TQStringList &dl, const TQString &hp );

    // Dictionary persistence and construction (defined elsewhere).
    void writeDict();
    void readDict();
    int makeIndex();

    // Takes three string lists and returns a string list.
    // NOTE(review): the meaning of each argument is not visible here.
    TQStringList query( const TQStringList&, const TQStringList&, const TQStringList& );
    TQString getDocumentTitle( const TQString& );

    void setDictionaryFile( const TQString& );
    void setDocListFile( const TQString& );

    // Document-list persistence and setup (defined elsewhere).
    void writeDocumentList();
    void readDocumentList();
    void setupDocumentList();

    /** Read-only access to docList; const so it works on a const Index. */
    const TQStringList& documentList() const { return docList; }
    /** Read-only access to titleList; const so it works on a const Index. */
    const TQStringList& titlesList() const { return titleList; }

signals:
    // Carries one int; presumably a progress value -- confirm at the emit sites.
    void indexingProgress( int );

private slots:
    void setLastWinClosed();

private:
    void parseDocument( const TQString&, int );
    void insertInDict( const TQString&, int );
    TQStringList getWildcardTerms( const TQString& );
    TQStringList split( const TQString& );
    KviValueList<Document> setupDummyTerm( const TQStringList& );
    bool searchForPattern( const TQStringList&, const TQStringList&, const TQString& );
    void buildMiniDict( const TQString& );

    TQStringList docList;
    TQStringList titleList;
    KviPointerHashTable<TQString,Entry> dict;
    KviPointerHashTable<TQString,PosEntry> miniDict;
    // NOTE(review): wordNum, alreadyHaveDocList and lastWindowClosed have no
    // in-class initialiser, so the constructors (not visible here) must set them.
    uint wordNum;
    TQString docPath;
    TQString dictFile, docListFile;
    bool alreadyHaveDocList;
    bool lastWindowClosed;
};
struct Term {
Term( const TQString &t, int f, KviValueList<Document> l )
: term( t ), frequency( f ), documents( l ) {}
TQString term;
int frequency;
KviValueList<Document>documents;
};
// TermList is a preprocessor alias: every later occurrence of the token
// expands to KviPointerList<Term>.
// NOTE(review): being a macro it ignores scoping; a typedef would be the
// usual choice, but the macro is kept so existing uses expand as before.
#define TermList KviPointerList<Term>
#endif
|