1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
|
/****************************************************************************
**
** Copyright (C) 1992-2005 Trolltech AS. All rights reserved.
**
** This file is part of the assistant application of the Qt Toolkit.
**
** This file may be distributed under the terms of the Q Public License
** as defined by Trolltech AS of Norway and appearing in the file
** LICENSE.QPL included in the packaging of this file.
**
** This file may be distributed and/or modified under the terms of the
** GNU General Public License version 2 as published by the Free Software
** Foundation and appearing in the file LICENSE.GPL included in the
** packaging of this file.
**
** See http://www.trolltech.com/pricing.html or email sales@trolltech.com for
** information about Qt Commercial License Agreements.
** See http://www.trolltech.com/qpl/ for QPL licensing information.
** See http://www.trolltech.com/gpl/ for GPL licensing information.
**
** Contact info@trolltech.com if any conditions of this licensing are
** not clear to you.
**
** This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
** WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
**
****************************************************************************/
#ifndef INDEX_H
#define INDEX_H
#include <qstringlist.h>
#include <qhash.h>
#include <qdatastream.h>
#include <qobject.h>
#include <qlist.h>
#include <qfile.h>
#include <qvector.h>
/**
 * A (document number, frequency) pair.
 *
 * Equality looks only at docNumber. The relational operators look only at
 * frequency and are reversed on purpose: the record with the LARGER
 * frequency compares as "less", so anything ordering by operator< places
 * higher frequencies first.
 */
struct Document {
    /// Default record: docNumber is -1 and frequency is 0.
    Document() : docNumber( -1 ), frequency( 0 ) {}

    /// Stores the two ints in the qint16 members docNumber and frequency.
    Document( int number, int count ) : docNumber( number ), frequency( count ) {}

    /// Two records are equal when their document numbers match.
    bool operator==( const Document &other ) const {
        return other.docNumber == docNumber;
    }

    /// "Less" means this record has the strictly greater frequency.
    bool operator<( const Document &other ) const {
        return other.frequency < frequency;
    }

    /// True when this record's frequency is not below the other's.
    bool operator<=( const Document &other ) const {
        return !( frequency < other.frequency );
    }

    /// "Greater" means this record has the strictly smaller frequency.
    bool operator>( const Document &other ) const {
        return other.frequency > frequency;
    }

    qint16 docNumber;   // compared by operator==
    qint16 frequency;   // compared by operator<, operator<= and operator>
};
// QDataStream insertion and extraction operators for Document.
// Only the declarations live in this header.
QDataStream &operator<<( QDataStream &stream, const Document &doc );
QDataStream &operator>>( QDataStream &stream, Document &doc );
/**
 * QObject-derived index class of the assistant application.
 *
 * This header only declares the interface and the data members; the member
 * functions are implemented outside this file. Comments marked
 * NOTE(review) are assumptions drawn from names and should be confirmed
 * against the implementation.
 */
class Index : public QObject
{
    Q_OBJECT

public:
    /// Value type held (by pointer) in dict: a vector of Document records.
    struct Entry {
        /// Starts the vector with the single record Document( docNumber, 1 ).
        Entry( int docNumber ) { documents.append( Document( docNumber, 1 ) ); }

        /// Initialises the vector from the Document vector passed in.
        Entry( QVector<Document> docs ) : documents( docs ) {}

        QVector<Document> documents;
    };

    /// Value type held (by pointer) in miniDict: a list of unsigned positions.
    struct PosEntry {
        /// Starts the list with the single value pos.
        PosEntry( int pos ) { positions.append( pos ); }

        QList<uint> positions;
    };

    // Two constructors: the first argument is either a single string or a
    // string list; the second is a string in both.
    // NOTE(review): dp / dl / hp look like "document path", "document list"
    // and "home path" -- confirm in the implementation.
    Index( const QString &dp, const QString &hp );
    Index( const QStringList &dl, const QString &hp );

    // NOTE(review): presumably persist / restore `dict` using dictFile.
    void writeDict();
    void readDict();

    // NOTE(review): the meaning of the int result is not visible here.
    int makeIndex();

    /// Takes three string lists and returns a string list.
    QStringList query( const QStringList&, const QStringList&, const QStringList& );

    /// Takes one string and returns a string.
    QString getDocumentTitle( const QString& );

    // NOTE(review): presumably assign dictFile and docListFile respectively.
    void setDictionaryFile( const QString& );
    void setDocListFile( const QString& );

signals:
    /// Signal carrying a single int argument.
    void indexingProgress( int );

private slots:
    // NOTE(review): presumably raises the lastWindowClosed flag.
    void setLastWinClosed();

private:
    // Internal helpers; their bodies are not part of this header.
    void setupDocumentList();
    void parseDocument( const QString&, int );
    void insertInDict( const QString&, int );
    void writeDocumentList();
    void readDocumentList();
    QStringList getWildcardTerms( const QString& );
    QStringList split( const QString& );
    QVector<Document> setupDummyTerm( const QStringList& );
    bool searchForPattern( const QStringList&, const QStringList&, const QString& );
    void buildMiniDict( const QString& );
    QString getCharsetForDocument(QFile *);

    // Data members (declaration order preserved).
    QStringList docList;
    QHash<QString, Entry*> dict;          // string key -> raw Entry pointer
    QHash<QString, PosEntry*> miniDict;   // string key -> raw PosEntry pointer
    uint wordNum;
    QString docPath;
    QString dictFile;
    QString docListFile;
    bool alreadyHaveDocList;
    bool lastWindowClosed;
};
#endif
|