-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtinydict.h
206 lines (176 loc) · 5.24 KB
/
tinydict.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
/** \file tinydict.h
\brief .dict dictionary file support interface
Lightweight implementation of .dict support, written from scratch.
(c) Vadim Lopatin, 2009
This source code is distributed under the terms of
GNU General Public License.
See LICENSE file for details.
usage:
init:
// create TinyDictionaryList object
TinyDictionaryList dicts;
// register dictionaries using
dicts.add( "/dir1/dict1.index", "/dir1/dict1.dict.dz" );
dicts.add( "/dir1/dict2.index", "/dir1/dict2.dict.dz" );
search:
// container for results
TinyDictResultList results;
dicts.find(results, "word", 0 ); // find exact match
process results:
// for each source dictionary that matches pattern
for ( int d = 0; d<results.length(); d++ ) {
TinyDictWordList * words = results.get(d);
printf("dict: %s\n", words->getDictionaryName() );
// for each found word
for ( int i=0; i<words->length(); i++ ) {
TinyDictWord * word = words->get(i);
printf("word: %s\n", word->getWord() );
printf("article: %s\n", words->getArticle( i ) );
}
}
*/
#ifndef TINYDICT_H_INCLUDED
#define TINYDICT_H_INCLUDED
#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include <zlib.h>
/// dictinary data file forward declaration
class TinyDictDataFile;
/// dictionary index file forward declaration
class TinyDictIndexFile;
/// dictonary forward declaration
class TinyDictionary;
/// Word entry of index file
class TinyDictWord
{
unsigned index;
unsigned indexpos;
unsigned start;
unsigned size;
char * word;
TinyDictWord( unsigned _index, unsigned _indexpos, unsigned _start, unsigned _size, const char * _word )
: index(_index)
, indexpos(_indexpos)
, start(_start)
, size(_size)
, word( strdup(_word) )
{
}
public:
/// factory - reading from index file
static TinyDictWord * read( FILE * f, unsigned index );
// getters
unsigned getIndexPos() const { return indexpos; }
unsigned getIndex() const { return index; }
unsigned getStart() const { return start; }
unsigned getSize() const { return size; }
const char * getWord() const { return word; }
int compare( const char * str ) const;
bool match( const char * str, bool exact ) const;
~TinyDictWord() { if ( word ) free( word ); }
};
/// word entry list
class TinyDictWordList
{
TinyDictionary * dict;
TinyDictWord ** list;
int size;
int count;
public:
// article access functions
/// set dictonary pointer list belongs to
void setDict( TinyDictionary * p ) { dict = p; }
/// returns word list's dictionary name
const char * getDictionaryName();
/// returns article for word by index
const char * getArticle( int index );
// search functions
/// searches list position by prefix
int find( const char * prefix );
// word list functions
/// returns number of words in list
int length() { return count; }
/// get item by index
TinyDictWord * get( int index ) { return list[index]; }
/// add word to list
void add( TinyDictWord * word );
/// clear list
void clear();
/// empty list constructor
TinyDictWordList();
/// destructor
~TinyDictWordList();
};
/// default mode: exact match
#define TINY_DICT_OPTION_EXACT_MATCH 0
/// search for words starting with specified pattern
#define TINY_DICT_OPTION_STARTS_WITH 1
class TinyDictionary
{
char * name;
TinyDictDataFile * data;
TinyDictIndexFile * index;
public:
/// searches dictionary for specified word, caller is responsible for deleting of returned object
TinyDictWordList * find( const char * prefix, int options = 0 );
/// returns short dictionary name
const char * getDictionaryName();
/// get dictionary data pointer
TinyDictDataFile * getData() { return data; }
/// get dictionary index pointer
//TinyDictIndexFile * getIndex() { return index; }
/// minimize memory usage
void compact();
/// open dictonary from files
bool open( const char * indexfile, const char * datafile );
/// empty dictinary constructor
TinyDictionary();
/// destructor
~TinyDictionary();
};
/// dictionary search result list
class TinyDictResultList
{
TinyDictWordList ** list;
int size;
int count;
public:
// word list functions
/// returns number of words in list
int length() { return count; }
/// get item by index
TinyDictWordList * get( int index ) { return list[index]; }
/// remove all dictionaries from list
void clear();
/// create empty list
TinyDictResultList();
/// destructor
~TinyDictResultList();
/// add item to list
void add( TinyDictWordList * p );
};
/// dictionary list
class TinyDictionaryList
{
TinyDictionary ** list;
int size;
int count;
public:
/// search all dictionaries in list for specified pattern
bool find( TinyDictResultList & result, const char * prefix, int options = 0 );
// word list functions
/// returns number of words in list
int length() { return count; }
/// get item by index
TinyDictionary * get( int index ) { return list[index]; }
/// remove all dictionaries from list
void clear();
/// create empty list
TinyDictionaryList();
/// destructor
~TinyDictionaryList();
/// try to open dictionary and add it to list
bool add( const char * indexfile, const char * datafile );
};
#endif //TINYDICT_H_INCLUDED