1 | Unit SearchUnit;
|
---|
2 |
|
---|
3 | // NewView - a new OS/2 Help Viewer
|
---|
4 | // Copyright 2003 Aaron Lawrence (aaronl at consultant dot com)
|
---|
5 | // This software is released under the Gnu Public License - see readme.txt
|
---|
6 |
|
---|
7 | Interface
|
---|
8 |
|
---|
9 | // Contains code to search help files.
|
---|
10 |
|
---|
11 | uses
|
---|
12 | Classes,
|
---|
13 | HelpFile,
|
---|
14 | TextSearchQuery,
|
---|
15 | IPFFileFormatUnit;
|
---|
16 |
|
---|
17 | const
|
---|
18 | // match weightings: multipliers applied to the relevance of a matched word
|
---|
19 | mwOnlyTitleWord = 200; // the matched word is the only word of a topic title
|
---|
20 | mwFirstTitleWord = 50; // the matched word is the first of several title words
|
---|
21 | mwTitleWord = 20; // the matched word is a later title word
|
---|
22 |
|
---|
23 | mwOnlyIndexWord = 100; // the matched word is the only word of an index entry
|
---|
24 | mwFirstIndexWord = 20; // the matched word is the first of several index entry words
|
---|
25 | mwIndexWord = 10; // the matched word is a later index entry word
|
---|
26 | mwTopicTextWord = 1; // NOTE(review): not referenced in the visible code of this unit
|
---|
27 |
|
---|
28 | // best case match weighting of a word (search word as long as the matched word)
|
---|
29 | mwExactWord = 20;
|
---|
30 |
|
---|
31 |
|
---|
32 | // Note on weightings: the title/index weightings
|
---|
33 | // are multiplied by word weightings.
|
---|
34 | // Topic text matches are equal to word weighting
|
---|
35 | // times word weighting.
|
---|
36 |
|
---|
37 | procedure SearchHelpFile( HelpFile: THelpFile;
|
---|
38 | Query: TTextSearchQuery;
|
---|
39 | Results: TList;
|
---|
40 | WordSequences: TList );
|
---|
41 |
|
---|
42 | // clear a list of word sequences (as produced by SearchHelpFile above)
|
---|
43 | procedure ClearWordSequences( WordSequences: TList;
|
---|
44 | DictionaryCount: longint );
|
---|
45 |
|
---|
46 | Implementation
|
---|
47 |
|
---|
48 | uses
|
---|
49 | SysUtils,
|
---|
50 | DebugUnit,
|
---|
51 | StringUtilsUnit,
|
---|
52 | HelpTopic;
|
---|
53 |
|
---|
54 | type
|
---|
55 | TSearchType = ( stGeneral, stStarts, stExactMatch, stEnds ); // NOTE(review): not referenced in the visible code of this unit
|
---|
56 |
|
---|
// Releases every dictionary relevance array held in WordSequence
// (each is handed to FreeUInt32Array with DictionaryCount as its size)
// and then empties the list. The list object itself is left alive.
procedure ClearWordSequence( WordSequence: TList;
                             DictionaryCount: longint );
var
  i: longint;
  pRelevances: UInt32ArrayPointer;
begin
  i := 0;
  while i < WordSequence.Count do
  begin
    pRelevances := WordSequence[ i ];
    FreeUInt32Array( pRelevances, DictionaryCount );
    inc( i );
  end;

  WordSequence.Clear;
end;
70 |
|
---|
// Clears a list of word sequences, as filled in by SearchHelpFile.
//
// WordSequences:   list whose entries are TLists of dictionary relevance
//                  arrays. Each inner list has its arrays released via
//                  ClearWordSequence and is then destroyed; finally the
//                  outer list is emptied (but not destroyed).
// DictionaryCount: number of entries in each relevance array.
//
// The parameter is named WordSequences to match the interface
// declaration and to avoid clashing with the local WordSequence.
procedure ClearWordSequences( WordSequences: TList;
                              DictionaryCount: longint );
var
  SequenceIndex: longint;
  WordSequence: TList;
begin
  for SequenceIndex := 0 to WordSequences.Count - 1 do
  begin
    WordSequence := WordSequences[ SequenceIndex ];
    ClearWordSequence( WordSequence,
                       DictionaryCount );
    WordSequence.Destroy;
  end;
  WordSequences.Clear;
end;
86 |
|
---|
87 |
|
---|
// Relevance of a search word that is already known to match ReferenceWord.
// The result is mwExactWord scaled by the fraction of the reference word
// that the search word covers (integer arithmetic), and never less than 1.
// ReferenceWord must not be empty: its length is used as the divisor.
function MatchedWordRelevance( const SearchWord: string;
                               const ReferenceWord: string ): longint;
var
  Scaled: longint;
begin
  Scaled := ( mwExactWord * Length( SearchWord ) ) div Length( ReferenceWord );

  if Scaled = 0 then
    // a match always counts for something
    Result := 1
  else
    Result := Scaled;
end;
99 |
|
---|
// Checks whether SearchWord occurs anywhere in ReferenceWord
// (located with CaseInsensitivePos).
// Returns 0 when it does not occur; otherwise the value of
// MatchedWordRelevance for the pair.
function CompareWord( const SearchWord: string;
                      const ReferenceWord: string ): longint;
begin
  if CaseInsensitivePos( SearchWord, ReferenceWord ) <> 0 then
    Result := MatchedWordRelevance( SearchWord, ReferenceWord )
  else
    // no match
    Result := 0;
end;
118 |
|
---|
// General dictionary search: partial matches count.
// For every dictionary word of HelpFile, the CompareWord score of
// SearchWord against that word is stored in Results at the word's
// dictionary index (0 = no match). Every entry is overwritten, so
// Results needs room for HelpFile.DictionaryCount entries.
procedure SearchDictionary( HelpFile: THelpFile;
                            SearchWord: string;
                            Results: UInt32ArrayPointer );
var
  WordIndex: integer;
  pWord: pstring;
begin
  for WordIndex := 0 to HelpFile.DictionaryCount - 1 do
  begin
    pWord := HelpFile.DictionaryWordPtrs[ WordIndex ];
    Results[ WordIndex ] := CompareWord( SearchWord, pWord^ );
  end;
end;
135 |
|
---|
// Exact dictionary search (case is ignored).
// Results is first filled with 0 for all HelpFile.DictionaryCount
// entries; each dictionary word equal to SearchWord then gets
// mwExactWord at its dictionary index.
procedure SearchDictionaryExact( HelpFile: THelpFile;
                                 SearchWord: string;
                                 Results: UInt32ArrayPointer );
var
  WordIndex: integer;
  pWord: pstring;
begin
  // start from "nothing matches"
  FillUInt32Array( Results, HelpFile.DictionaryCount, 0 );

  for WordIndex := 0 to HelpFile.DictionaryCount - 1 do
  begin
    pWord := HelpFile.DictionaryWordPtrs[ WordIndex ];
    if StrEqualIgnoringCase( SearchWord, pWord^ ) then
    begin
      Results[ WordIndex ] := mwExactWord;
    end;
  end;
end;
154 |
|
---|
// Dictionary search for words that start with SearchWord
// (tested with StrStartsWithIgnoringCase).
// Results is first filled with 0 for all HelpFile.DictionaryCount
// entries; each matching dictionary word then gets its
// MatchedWordRelevance at its dictionary index.
procedure SearchDictionaryStarts( HelpFile: THelpFile;
                                  SearchWord: string;
                                  Results: UInt32ArrayPointer );
var
  WordIndex: integer;
  Candidate: string;
begin
  if IsLogAspectsEnabled(LogSearch) then
    LogEvent(LogSearch, ' calling SearchDictionaryStarts "' + SearchWord + '"');

  // start from "nothing matches"
  FillUInt32Array( Results, HelpFile.DictionaryCount, 0 );

  for WordIndex := 0 to HelpFile.DictionaryCount - 1 do
  begin
    Candidate := HelpFile.DictionaryWords[ WordIndex ];
    if StrStartsWithIgnoringCase(Candidate, SearchWord) then
      Results[ WordIndex ] := MatchedWordRelevance( SearchWord, Candidate );
  end;
end;
180 |
|
---|
181 |
|
---|
// Dictionary search for words that end with SearchWord
// (tested with StrEndsWithIgnoringCase).
// Results is first filled with 0 for all HelpFile.DictionaryCount
// entries; each matching dictionary word then gets its
// MatchedWordRelevance at its dictionary index.
procedure SearchDictionaryEnds( HelpFile: THelpFile;
                                SearchWord: string;
                                Results: UInt32ArrayPointer );
var
  WordIndex: integer;
  Candidate: string;
begin
  if IsLogAspectsEnabled(LogSearch) then
    LogEvent(LogSearch, ' calling SearchDictionaryEnds for "' + SearchWord + '"');

  // start from "nothing matches"
  FillUInt32Array( Results, HelpFile.DictionaryCount, 0 );

  for WordIndex := 0 to HelpFile.DictionaryCount - 1 do
  begin
    Candidate := HelpFile.DictionaryWords[ WordIndex ];
    if StrEndsWithIgnoringCase(Candidate, SearchWord ) then
      Results[ WordIndex ] := MatchedWordRelevance( SearchWord, Candidate );
  end;
end;
206 |
|
---|
// Search titles of topics for the given search word.
//
// Each topic title is split into words with StrExtractStringsQuoted and
// every word is scored with CompareWord. For each matching word the
// topic's entry in Results (indexed by the topic's position in
// HelpFile.Topics) is increased by the word's relevance times:
//   mwOnlyTitleWord  - the title consists of that single word
//   mwFirstTitleWord - it is the first of several title words
//   mwTitleWord      - it is any later title word
// Results is accumulated into, not reset.
procedure SearchTopicTitles( HelpFile: THelpFile;
                             SearchWord: string;
                             Results: UInt32ArrayPointer );
var
  TopicIndex: longint;
  pTitle: pstring;
  Topic: TTopic;
  WordRelevance: longint;
  Weighting: longint;
  tmpTitleWords : TStringList;
  i : integer;
begin
  if IsLogAspectsEnabled(LogSearch) then
  begin
    LogEvent(LogSearch, ' calling SearchTopicTitles for "' + SearchWord + '"');
  end;

  tmpTitleWords := TStringList.Create;
  try
    // Search topic titles
    for TopicIndex := 0 to HelpFile.TopicCount - 1 do
    begin
      Topic := HelpFile.Topics[ TopicIndex ];
      pTitle := Topic.TitlePtr;

      tmpTitleWords.Clear;
      StrExtractStringsQuoted(tmpTitleWords, pTitle^);

      for i := 0 to tmpTitleWords.Count - 1 do
      begin
        WordRelevance := CompareWord( SearchWord, tmpTitleWords[ i ] );
        if WordRelevance > 0 then
        begin
          if i > 0 then
            Weighting := mwTitleWord
          else if tmpTitleWords.Count = 1 then
            // matching the first word is best; in fact it's the only word
            Weighting := mwOnlyTitleWord
          else
            // matching the first word is best
            Weighting := mwFirstTitleWord;

          inc( Results[ TopicIndex ],
               Weighting * WordRelevance );
        end;
      end;
    end;
  finally
    // release the scratch list even if splitting or comparing raised
    tmpTitleWords.Destroy;
  end;
end;
269 |
|
---|
// Search index entries for the given search word.
//
// Each index entry is split into words with StrExtractStringsQuoted and
// every word is scored with CompareWord. For each matching word, the
// entry of Results belonging to the topic attached to that index entry
// (Results[ Topic.Index ]) is increased by the word's relevance times:
//   mwOnlyIndexWord  - the index entry consists of that single word
//   mwFirstIndexWord - it is the first of several words
//   mwIndexWord      - it is any later word
// Results is accumulated into, not reset.
procedure SearchIndex( HelpFile: THelpFile;
                       SearchWord: string;
                       Results: UInt32ArrayPointer );
var
  IndexIndex: longint;
  pIndexEntry: pstring;
  Topic: TTopic;
  WordRelevance: longint;
  Weighting: longint;
  tmpIndexWords : TStringList;
  i : integer;
begin
  if IsLogAspectsEnabled(LogSearch) then
  begin
    LogEvent(LogSearch, ' calling SearchIndex for "' + SearchWord + '"');
  end;

  tmpIndexWords := TStringList.Create;
  try
    for IndexIndex := 0 to HelpFile.Index.Count - 1 do
    begin
      Topic := HelpFile.Index.Objects[ IndexIndex ] as TTopic;
      pIndexEntry := HelpFile.IndexEntryPtr[ IndexIndex ];

      tmpIndexWords.Clear;
      StrExtractStringsQuoted(tmpIndexWords, pIndexEntry^);

      for i := 0 to tmpIndexWords.Count - 1 do
      begin
        WordRelevance := CompareWord( SearchWord, tmpIndexWords[ i ] );
        if WordRelevance > 0 then
        begin
          if i > 0 then
            Weighting := mwIndexWord
          else if tmpIndexWords.Count = 1 then
            // matching the first word is best; in fact it's the only word
            Weighting := mwOnlyIndexWord
          else
            // matching the first word is best
            Weighting := mwFirstIndexWord;

          inc( Results[ Topic.Index ],
               Weighting * WordRelevance );
        end;
      end;
    end;
  finally
    // release the scratch list even if splitting or comparing raised
    tmpIndexWords.Destroy;
  end;
end;
332 |
|
---|
333 | // ------------------------------------------------------
|
---|
334 |
|
---|
// Master search function. Given a search query,
// searches topic text, titles and index entries of HelpFile.
//
// HelpFile:      file to search. Nothing is done if it has no SearchTable.
// Query:         parsed query; each of its terms is searched in turn and
//                combined according to the term's CombineMethod.
// Results:       every topic that is not excluded and ends up with a
//                relevance > 0 is added here, after its SearchRelevance
//                has been set.
// WordSequences: may be nil. Otherwise, for each term that is not
//                cmExcluded, a TList of dictionary relevance arrays (one
//                array per term part) is appended; the caller releases
//                them with ClearWordSequences.
procedure SearchHelpFile( HelpFile: THelpFile;
                          Query: TTextSearchQuery;
                          Results: TList;
                          WordSequences: TList );
var
  tmpTopicCount: longint;
  tmpTopic: TTopic;
  tmpTopicIndex: longint;
  tmpTermIndex: longint;
  tmpTerm: TSearchTerm;

  DictionaryRelevances: UInt32ArrayPointer;

  TopicsMatchingDictWord: UInt32ArrayPointer; // flags
  TopicsMatchingTermPart: UInt32ArrayPointer; // flags
  TopicsMatchingTerm: UInt32ArrayPointer; // flag then relevances
  TopicRelevances: UInt32ArrayPointer;
  TopicsExcluded: UInt32ArrayPointer;

  TopicRelevanceForTerm: longint;

  WordRelevance: longint;
  DictIndex: longint;

  TermPartIndex: longint;
  TermPart: string;

  TermWordSequence: TList;
  KeepWordSequence: boolean; // true once the sequence belongs to WordSequences
begin
  LogEvent(LogSearch, 'SearchHelpFile');
  Query.Log;

  if HelpFile.SearchTable = nil then
  begin
    exit;
  end;

  // Reset flags per topic
  tmpTopicCount := HelpFile.TopicCount;

  // Get memory for topic relevance arrays

  AllocUInt32Array( TopicsMatchingDictWord, tmpTopicCount );
  AllocUInt32Array( TopicsMatchingTermPart, tmpTopicCount );
  AllocUInt32Array( TopicsMatchingTerm, tmpTopicCount );
  AllocUInt32Array( TopicRelevances, tmpTopicCount ); // functions as a flag and a cumulative relevance

  AllocUInt32Array( TopicsExcluded, tmpTopicCount ); // Exclusions are treated as boolean only


  ClearUInt32Array( TopicRelevances, tmpTopicCount );
  ClearUInt32Array( TopicsExcluded, tmpTopicCount );

  for tmpTermIndex := 0 to Query.TermCount - 1 do
  begin
    tmpTerm := Query.Term[ tmpTermIndex ];

    if IsLogAspectsEnabled(LogSearch) then
    begin
      LogEvent(LogSearch, 'Searching for term "'
                          + tmpTerm.Text
                          + '", '
                          + IntToStr( tmpTerm.Parts.Count )
                          + ' parts' );
    end;

    // Start each term from "no topic text matches". The first term part
    // overwrites this; for a term without any parts it prevents reading
    // uninitialised/stale flags (and dividing by a part count of zero)
    // in the sequence check below.
    ClearUInt32Array( TopicsMatchingTerm, tmpTopicCount );

    // look thru all parts of the term. eg. CAKE_SAUSAGE

    TermWordSequence := TList.Create;

    KeepWordSequence := false;
    if WordSequences <> nil then
      if tmpTerm.CombineMethod <> cmExcluded then
      begin
        // this term is an inclusive one, so we want to remember the matches
        WordSequences.Add( TermWordSequence );
        KeepWordSequence := true;
      end;

    for TermPartIndex := 0 to tmpTerm.Parts.Count - 1 do
    begin
      TermPart := tmpTerm.Parts[ TermPartIndex ];

      if IsLogAspectsEnabled(LogSearch) then
      begin
        LogEvent(LogSearch, ' Searching for TermPart [' + TermPart + ']' );
      end;

      AllocUInt32Array( DictionaryRelevances, HelpFile.DictionaryCount );

      TermWordSequence.Add( DictionaryRelevances );

      // Search the dictionary for matches.
      // alpha numeric match

      if tmpTerm.Parts.Count = 1 then
      begin
        if IsLogAspectsEnabled(LogSearch) then
        begin
          LogEvent(LogSearch, ' Term has only one part...' );
          LogEvent(LogSearch, ' SearchDictionary [' + TermPart + ']' );
        end;

        // general match allowing all kinds of partial matches
        SearchDictionary( HelpFile, TermPart, DictionaryRelevances )
      end

      else if TermPartIndex = 0 then
      begin
        if IsLogAspectsEnabled(LogSearch) then
        begin
          LogEvent(LogSearch, ' Term has more then one part... we are at first' );
          LogEvent(LogSearch, ' SearchDictionaryEnd [' + TermPart + ']' );
        end;

        // first term part: word must match end of a topic word e.g. must end in "cake"
        SearchDictionaryEnds( HelpFile, TermPart, DictionaryRelevances )
      end

      else if TermPartIndex = tmpTerm.Parts.Count - 1 then
      begin
        if IsLogAspectsEnabled(LogSearch) then
        begin
          LogEvent(LogSearch, ' Term has more then one part... we are at last' );
          LogEvent(LogSearch, ' SearchDictionaryStarts [' + TermPart + ']' );
        end;

        // last term part: word must match start of a topic word e.g. must start with "sausage"
        SearchDictionaryStarts( HelpFile, TermPart, DictionaryRelevances )
      end

      else
      begin
        if IsLogAspectsEnabled(LogSearch) then
        begin
          LogEvent(LogSearch, ' Term has more then one part... we are inside' );
          LogEvent(LogSearch, ' SearchDictionaryExact [' + TermPart + ']' );
        end;

        // intermediate term part: word must match exactly e.g. must be "_"
        SearchDictionaryExact( HelpFile, TermPart, DictionaryRelevances )
      end;

      // For each word in the dictionary that matches
      // this search term part, search topic texts

      LogEvent(LogSearch, ' Dictionary search done' );
      ClearUInt32Array( TopicsMatchingTermPart, tmpTopicCount );

      for DictIndex := 0 to HelpFile.DictionaryCount - 1 do
      begin
        WordRelevance := DictionaryRelevances[ DictIndex ];
        if WordRelevance > 0 then
        begin
          // Search for occurrences of this word
          // within the text of topics
          HelpFile.SearchTable.Search( DictIndex,
                                       TopicsMatchingDictWord );

          // TopicsMatchingDictWord now flags the topics
          // that contain this word; merge them into the
          // flags for the whole term part.

          OrUInt32Array( TopicsMatchingDictWord,
                         TopicsMatchingTermPart,
                         tmpTopicCount );
        end
      end;

      LogEvent(LogSearch, ' Topic searches done' );

      if TermPartIndex = 0 then
        // first part, just copy
        CopyUInt32Array( TopicsMatchingTermPart,
                         TopicsMatchingTerm,
                         tmpTopicCount )
      else
        // and with previous term part results
        AndUInt32Array( TopicsMatchingTermPart,
                        TopicsMatchingTerm,
                        tmpTopicCount );

      // loop for next term part (IPF word)
    end;

    // Now we have searched the dictionary and worked out matching topics
    // for all parts of the term. Now combine all together

    LogEvent(LogSearch, 'Checking for sequences' );
    for tmpTopicIndex := 0 to tmpTopicCount - 1 do
    begin
      if TopicsMatchingTerm[ tmpTopicIndex ] > 0 then
      begin
        tmpTopic := HelpFile.Topics[ tmpTopicIndex ];
        // Topic text contained a match for the all the parts
        // of the term.
        // Now we need to:
        // - verify that they actually occur all in a sequence (if it's a multi-part term)
        // - count occurrences for relevance.

        TopicRelevanceForTerm := tmpTopic.SearchForWordSequences( TermWordSequence, false ); // don't stop at first match

        TopicRelevanceForTerm := TopicRelevanceForTerm div tmpTerm.Parts.Count; // divide to bring back into scale

        TopicsMatchingTerm[ tmpTopicIndex ] := TopicRelevanceForTerm;

      end;
    end;

    if not KeepWordSequence then
    begin
      // The sequence was not handed over to the caller (no WordSequences
      // list given, or this is an excluded term), so release it here.
      ClearWordSequence( TermWordSequence,
                         HelpFile.DictionaryCount );
      TermWordSequence.Destroy;
    end;

    // Search titles and index

    LogEvent(LogSearch, ' Searching titles' );
    SearchTopicTitles( HelpFile, tmpTerm.Text, TopicsMatchingTerm );

    LogEvent(LogSearch, ' Searching index' );
    SearchIndex( HelpFile, tmpTerm.Text, TopicsMatchingTerm );

    LogEvent(LogSearch, ' Combining' );
    case tmpTerm.CombineMethod of
      cmOptional:
      begin
        LogEvent(LogSearch, ' Combining optional');
        AddUInt32Array( TopicsMatchingTerm,
                        TopicRelevances,
                        tmpTopicCount );
      end;

      cmRequired:
      begin
        LogEvent(LogSearch, ' Combining required');
        // if zero then add to exclusions
        NotOrUInt32Array( TopicsMatchingTerm,
                          TopicsExcluded,
                          tmpTopicCount );

        AddUInt32Array( TopicsMatchingTerm,
                        TopicRelevances,
                        tmpTopicCount );
      end;

      cmExcluded:
      begin
        LogEvent(LogSearch, ' Combining excluded');
        OrUInt32Array( TopicsMatchingTerm,
                       TopicsExcluded,
                       tmpTopicCount );
      end;
    end;

    // Term.ClearMatches;

    // loop for next term...
  end;

  LogEvent(LogSearch, 'Search completed, converting to list' );

  // Now convert to list form.

  for tmpTopicIndex := 0 to tmpTopicCount - 1 do
  begin
    if TopicsExcluded[ tmpTopicIndex ] = 0 then
    begin
      tmpTopic := HelpFile.Topics[ tmpTopicIndex ];
      tmpTopic.SearchRelevance := TopicRelevances[ tmpTopicIndex ];
      if tmpTopic.SearchRelevance > 0 then
      begin
        Results.Add( tmpTopic );
      end;
    end;
  end;

  LogEvent(LogSearch, 'Freeing arrays' );
  FreeUInt32Array( TopicRelevances, tmpTopicCount );
  FreeUInt32Array( TopicsExcluded, tmpTopicCount );
  FreeUInt32Array( TopicsMatchingTerm, tmpTopicCount );
  FreeUInt32Array( TopicsMatchingTermPart, tmpTopicCount );
  FreeUInt32Array( TopicsMatchingDictWord, tmpTopicCount );

  LogEvent(LogSearch, 'Done' );
end;
628 |
|
---|
629 | Initialization
|
---|
630 | End.
|
---|