]>
Commit | Line | Data |
---|---|---|
8ec2b484 | 1 | ///////////////////////////////////////////////////////////////////////////// |
93763ad5 | 2 | // Name: src/html/helpdata.cpp |
8ec2b484 | 3 | // Purpose: wxHtmlHelpData |
f42b1601 | 4 | // Notes: Based on htmlhelp.cpp, implementing a monolithic |
8ec2b484 HH |
5 | // HTML Help controller class, by Vaclav Slavik |
6 | // Author: Harm van der Heijden and Vaclav Slavik | |
69941f05 | 7 | // RCS-ID: $Id$ |
8ec2b484 | 8 | // Copyright: (c) Harm van der Heijden and Vaclav Slavik |
65571936 | 9 | // Licence: wxWindows licence |
8ec2b484 HH |
10 | ///////////////////////////////////////////////////////////////////////////// |
11 | ||
8ec2b484 HH |
12 | // For compilers that support precompilation, includes "wx.h". |
13 | #include "wx/wxprec.h" | |
14 | ||
15 | #ifdef __BORLANDC__ | |
93763ad5 | 16 | #pragma hdrstop |
8ec2b484 HH |
17 | #endif |
18 | ||
f6bcfd97 | 19 | #if wxUSE_HTML && wxUSE_STREAMS |
8ec2b484 HH |
20 | |
21 | #ifndef WXPRECOMP | |
04dbb646 VZ |
22 | #include "wx/intl.h" |
23 | #include "wx/log.h" | |
8ec2b484 HH |
24 | #endif |
25 | ||
401eb3de RR |
26 | #include <ctype.h> |
27 | ||
8ec2b484 HH |
28 | #include "wx/html/helpdata.h" |
29 | #include "wx/tokenzr.h" | |
30 | #include "wx/wfstream.h" | |
31 | #include "wx/busyinfo.h" | |
f890e2d4 VS |
32 | #include "wx/encconv.h" |
33 | #include "wx/fontmap.h" | |
69941f05 | 34 | #include "wx/html/htmlpars.h" |
8ec2b484 | 35 | #include "wx/html/htmldefs.h" |
2b5f62a0 | 36 | #include "wx/html/htmlfilt.h" |
057b55b0 | 37 | #include "wx/filename.h" |
8ec2b484 HH |
38 | |
39 | #include "wx/arrimpl.cpp" | |
40 | WX_DEFINE_OBJARRAY(wxHtmlBookRecArray) | |
91fa114d | 41 | WX_DEFINE_OBJARRAY(wxHtmlHelpDataItems) |
8ec2b484 HH |
42 | |
43 | //----------------------------------------------------------------------------- | |
44 | // static helper functions | |
45 | //----------------------------------------------------------------------------- | |
46 | ||
47 | // Reads one line, stores it into buf and returns pointer to new line or NULL. | |
1a1dac18 | 48 | static const wxChar* ReadLine(const wxChar *line, wxChar *buf, size_t bufsize) |
8ec2b484 | 49 | { |
1a1dac18 MB |
50 | wxChar *writeptr = buf; |
51 | wxChar *endptr = buf + bufsize - 1; | |
52 | const wxChar *readptr = line; | |
8ec2b484 | 53 | |
1a1dac18 | 54 | while (*readptr != 0 && *readptr != _T('\r') && *readptr != _T('\n') && |
d1da8872 | 55 | writeptr != endptr) |
3dde6c72 | 56 | *(writeptr++) = *(readptr++); |
8ec2b484 | 57 | *writeptr = 0; |
1a1dac18 | 58 | while (*readptr == _T('\r') || *readptr == _T('\n')) |
3dde6c72 VS |
59 | readptr++; |
60 | if (*readptr == 0) | |
61 | return NULL; | |
d1da8872 | 62 | else |
3dde6c72 | 63 | return readptr; |
8ec2b484 HH |
64 | } |
65 | ||
66 | ||
8ec2b484 | 67 | |
91fa114d VS |
68 | static int |
69 | wxHtmlHelpIndexCompareFunc(wxHtmlHelpDataItem **a, wxHtmlHelpDataItem **b) | |
8ec2b484 | 70 | { |
91fa114d VS |
71 | wxHtmlHelpDataItem *ia = *a; |
72 | wxHtmlHelpDataItem *ib = *b; | |
3912b3f8 | 73 | |
7fbe5489 VS |
74 | if (ia == NULL) |
75 | return -1; | |
76 | if (ib == NULL) | |
77 | return 1; | |
42841dfc | 78 | |
91fa114d VS |
79 | if (ia->parent == ib->parent) |
80 | { | |
81 | return ia->name.CmpNoCase(ib->name); | |
82 | } | |
83 | else if (ia->level == ib->level) | |
84 | { | |
85 | return wxHtmlHelpIndexCompareFunc(&ia->parent, &ib->parent); | |
86 | } | |
87 | else | |
88 | { | |
89 | wxHtmlHelpDataItem *ia2 = ia; | |
90 | wxHtmlHelpDataItem *ib2 = ib; | |
d1da8872 | 91 | |
91fa114d VS |
92 | while (ia2->level > ib2->level) |
93 | { | |
94 | ia2 = ia2->parent; | |
95 | } | |
96 | while (ib2->level > ia2->level) | |
97 | { | |
98 | ib2 = ib2->parent; | |
99 | } | |
d1da8872 | 100 | |
91fa114d VS |
101 | wxASSERT(ia2); |
102 | wxASSERT(ib2); | |
103 | int res = wxHtmlHelpIndexCompareFunc(&ia2, &ib2); | |
104 | if (res != 0) | |
105 | return res; | |
106 | else if (ia->level > ib->level) | |
107 | return 1; | |
108 | else | |
109 | return -1; | |
110 | } | |
8ec2b484 HH |
111 | } |
112 | ||
8ec2b484 HH |
113 | //----------------------------------------------------------------------------- |
114 | // HP_Parser | |
115 | //----------------------------------------------------------------------------- | |
116 | ||
117 | class HP_Parser : public wxHtmlParser | |
118 | { | |
211dfedd | 119 | public: |
67c276bd VS |
120 | HP_Parser() |
121 | { | |
122 | GetEntitiesParser()->SetEncoding(wxFONTENCODING_ISO8859_1); | |
123 | } | |
fc7a2a60 | 124 | |
211dfedd | 125 | wxObject* GetProduct() { return NULL; } |
fc7a2a60 | 126 | |
211dfedd VS |
127 | protected: |
128 | virtual void AddText(const wxChar* WXUNUSED(txt)) {} | |
fc7a2a60 VZ |
129 | |
130 | DECLARE_NO_COPY_CLASS(HP_Parser) | |
8ec2b484 HH |
131 | }; |
132 | ||
133 | ||
134 | //----------------------------------------------------------------------------- | |
135 | // HP_TagHandler | |
136 | //----------------------------------------------------------------------------- | |
137 | ||
138 | class HP_TagHandler : public wxHtmlTagHandler | |
139 | { | |
140 | private: | |
91fa114d VS |
141 | wxString m_name, m_page; |
142 | int m_level; | |
143 | int m_id; | |
144 | int m_index; | |
145 | int m_count; | |
146 | wxHtmlHelpDataItem *m_parentItem; | |
147 | wxHtmlBookRecord *m_book; | |
d1da8872 | 148 | |
91fa114d | 149 | wxHtmlHelpDataItems *m_data; |
8ec2b484 HH |
150 | |
151 | public: | |
04dbb646 | 152 | HP_TagHandler(wxHtmlBookRecord *b) : wxHtmlTagHandler() |
91fa114d VS |
153 | { |
154 | m_data = NULL; | |
155 | m_book = b; | |
156 | m_name = m_page = wxEmptyString; | |
157 | m_level = 0; | |
d1da8872 | 158 | m_id = wxID_ANY; |
91fa114d VS |
159 | m_count = 0; |
160 | m_parentItem = NULL; | |
161 | } | |
66a77a74 | 162 | wxString GetSupportedTags() { return wxT("UL,OBJECT,PARAM"); } |
8ec2b484 | 163 | bool HandleTag(const wxHtmlTag& tag); |
91fa114d VS |
164 | |
165 | void Reset(wxHtmlHelpDataItems& data) | |
166 | { | |
167 | m_data = &data; | |
168 | m_count = 0; | |
169 | m_level = 0; | |
170 | m_parentItem = NULL; | |
171 | } | |
22f3361e VZ |
172 | |
173 | DECLARE_NO_COPY_CLASS(HP_TagHandler) | |
8ec2b484 HH |
174 | }; |
175 | ||
176 | ||
177 | bool HP_TagHandler::HandleTag(const wxHtmlTag& tag) | |
178 | { | |
04dbb646 | 179 | if (tag.GetName() == wxT("UL")) |
4f9297b0 | 180 | { |
91fa114d VS |
181 | wxHtmlHelpDataItem *oldparent = m_parentItem; |
182 | m_level++; | |
183 | m_parentItem = (m_count > 0) ? &(*m_data)[m_data->size()-1] : NULL; | |
8ec2b484 | 184 | ParseInner(tag); |
91fa114d VS |
185 | m_level--; |
186 | m_parentItem = oldparent; | |
187 | return true; | |
8ec2b484 | 188 | } |
04dbb646 | 189 | else if (tag.GetName() == wxT("OBJECT")) |
4f9297b0 | 190 | { |
91fa114d | 191 | m_name = m_page = wxEmptyString; |
8ec2b484 | 192 | ParseInner(tag); |
50494a55 | 193 | |
daa084c2 | 194 | #if 0 |
91fa114d | 195 | if (!page.IsEmpty()) |
7df9fbc3 | 196 | /* Valid HHW's file may contain only two object tags: |
04dbb646 | 197 | |
4157f43f VS |
198 | <OBJECT type="text/site properties"> |
199 | <param name="ImageType" value="Folder"> | |
200 | </OBJECT> | |
04dbb646 | 201 | |
4157f43f | 202 | or |
04dbb646 VZ |
203 | |
204 | <OBJECT type="text/sitemap"> | |
205 | <param name="Name" value="main page"> | |
206 | <param name="Local" value="another.htm"> | |
207 | </OBJECT> | |
208 | ||
91fa114d | 209 | We're interested in the latter. !page.IsEmpty() is valid |
4157f43f VS |
210 | condition because text/site properties does not contain Local param |
211 | */ | |
daa084c2 VS |
212 | #endif |
213 | if (tag.GetParam(wxT("TYPE")) == wxT("text/sitemap")) | |
4157f43f | 214 | { |
91fa114d VS |
215 | wxHtmlHelpDataItem *item = new wxHtmlHelpDataItem(); |
216 | item->parent = m_parentItem; | |
217 | item->level = m_level; | |
218 | item->id = m_id; | |
219 | item->page = m_page; | |
220 | item->name = m_name; | |
d1da8872 | 221 | |
91fa114d VS |
222 | item->book = m_book; |
223 | m_data->Add(item); | |
224 | m_count++; | |
4157f43f | 225 | } |
50494a55 | 226 | |
91fa114d | 227 | return true; |
8ec2b484 | 228 | } |
04dbb646 | 229 | else |
4f9297b0 | 230 | { // "PARAM" |
91fa114d VS |
231 | if (m_name.empty() && tag.GetParam(wxT("NAME")) == wxT("Name")) |
232 | m_name = tag.GetParam(wxT("VALUE")); | |
04dbb646 | 233 | if (tag.GetParam(wxT("NAME")) == wxT("Local")) |
91fa114d | 234 | m_page = tag.GetParam(wxT("VALUE")); |
04dbb646 | 235 | if (tag.GetParam(wxT("NAME")) == wxT("ID")) |
91fa114d VS |
236 | tag.GetParamAsInt(wxT("VALUE"), &m_id); |
237 | return false; | |
8ec2b484 HH |
238 | } |
239 | } | |
240 | ||
241 | ||
8ec2b484 HH |
242 | //----------------------------------------------------------------------------- |
243 | // wxHtmlHelpData | |
244 | //----------------------------------------------------------------------------- | |
245 | ||
468ae730 VS |
246 | wxString wxHtmlBookRecord::GetFullPath(const wxString &page) const |
247 | { | |
248 | if (wxIsAbsolutePath(page)) | |
249 | return page; | |
250 | else | |
251 | return m_BasePath + page; | |
252 | } | |
253 | ||
91fa114d VS |
254 | wxString wxHtmlHelpDataItem::GetIndentedName() const |
255 | { | |
256 | wxString s; | |
257 | for (int i = 1; i < level; i++) | |
258 | s << _T(" "); | |
259 | s << name; | |
260 | return s; | |
261 | } | |
468ae730 VS |
262 | |
263 | ||
8ec2b484 HH |
264 | IMPLEMENT_DYNAMIC_CLASS(wxHtmlHelpData, wxObject) |
265 | ||
f42b1601 | 266 | wxHtmlHelpData::wxHtmlHelpData() |
8ec2b484 | 267 | { |
91fa114d VS |
268 | #if WXWIN_COMPATIBILITY_2_4 |
269 | m_cacheContents = NULL; | |
270 | m_cacheIndex = NULL; | |
271 | #endif | |
8ec2b484 HH |
272 | } |
273 | ||
274 | wxHtmlHelpData::~wxHtmlHelpData() | |
275 | { | |
91fa114d VS |
276 | #if WXWIN_COMPATIBILITY_2_4 |
277 | CleanCompatibilityData(); | |
278 | #endif | |
8ec2b484 HH |
279 | } |
280 | ||
67c276bd VS |
281 | bool wxHtmlHelpData::LoadMSProject(wxHtmlBookRecord *book, wxFileSystem& fsys, |
282 | const wxString& indexfile, | |
283 | const wxString& contentsfile) | |
8ec2b484 HH |
284 | { |
285 | wxFSFile *f; | |
2b5f62a0 | 286 | wxHtmlFilterHTML filter; |
eb37e1d2 | 287 | wxString buf; |
8ec2b484 | 288 | wxString string; |
f42b1601 | 289 | |
8ec2b484 HH |
290 | HP_Parser parser; |
291 | HP_TagHandler *handler = new HP_TagHandler(book); | |
292 | parser.AddTagHandler(handler); | |
293 | ||
93763ad5 | 294 | f = ( contentsfile.empty() ? (wxFSFile*) NULL : fsys.OpenFile(contentsfile) ); |
04dbb646 | 295 | if (f) |
4f9297b0 | 296 | { |
eb37e1d2 | 297 | buf.clear(); |
2b5f62a0 | 298 | buf = filter.ReadFile(*f); |
8ec2b484 | 299 | delete f; |
91fa114d | 300 | handler->Reset(m_contents); |
8ec2b484 | 301 | parser.Parse(buf); |
8ec2b484 | 302 | } |
f3c82859 | 303 | else |
2b5f62a0 | 304 | { |
f6bcfd97 | 305 | wxLogError(_("Cannot open contents file: %s"), contentsfile.c_str()); |
2b5f62a0 | 306 | } |
8ec2b484 | 307 | |
93763ad5 | 308 | f = ( indexfile.empty() ? (wxFSFile*) NULL : fsys.OpenFile(indexfile) ); |
04dbb646 | 309 | if (f) |
4f9297b0 | 310 | { |
eb37e1d2 | 311 | buf.clear(); |
2b5f62a0 | 312 | buf = filter.ReadFile(*f); |
8ec2b484 | 313 | delete f; |
91fa114d | 314 | handler->Reset(m_index); |
8ec2b484 | 315 | parser.Parse(buf); |
8ec2b484 | 316 | } |
93763ad5 | 317 | else if (!indexfile.empty()) |
2b5f62a0 | 318 | { |
f6bcfd97 | 319 | wxLogError(_("Cannot open index file: %s"), indexfile.c_str()); |
2b5f62a0 | 320 | } |
d1da8872 | 321 | return true; |
8ec2b484 HH |
322 | } |
323 | ||
4fd5055c VS |
324 | inline static void CacheWriteInt32(wxOutputStream *f, wxInt32 value) |
325 | { | |
326 | wxInt32 x = wxINT32_SWAP_ON_BE(value); | |
327 | f->Write(&x, sizeof(x)); | |
328 | } | |
f35822af | 329 | |
4fd5055c VS |
330 | inline static wxInt32 CacheReadInt32(wxInputStream *f) |
331 | { | |
332 | wxInt32 x; | |
333 | f->Read(&x, sizeof(x)); | |
334 | return wxINT32_SWAP_ON_BE(x); | |
335 | } | |
f35822af | 336 | |
3912b3f8 | 337 | inline static void CacheWriteString(wxOutputStream *f, const wxString& str) |
d1da8872 | 338 | { |
3912b3f8 VS |
339 | const wxWX2MBbuf mbstr = str.mb_str(wxConvUTF8); |
340 | size_t len = strlen((const char*)mbstr)+1; | |
4fd5055c | 341 | CacheWriteInt32(f, len); |
3912b3f8 | 342 | f->Write((const char*)mbstr, len); |
4fd5055c | 343 | } |
f35822af | 344 | |
3912b3f8 | 345 | inline static wxString CacheReadString(wxInputStream *f) |
4fd5055c | 346 | { |
4fd5055c | 347 | size_t len = (size_t)CacheReadInt32(f); |
3912b3f8 VS |
348 | wxCharBuffer str(len-1); |
349 | f->Read(str.data(), len); | |
350 | return wxString(str, wxConvUTF8); | |
4fd5055c | 351 | } |
f35822af | 352 | |
91fa114d | 353 | #define CURRENT_CACHED_BOOK_VERSION 5 |
d1a9c82b VS |
354 | |
355 | // Additional flags to detect incompatibilities of the runtime environment: | |
356 | #define CACHED_BOOK_FORMAT_FLAGS \ | |
357 | (wxUSE_UNICODE << 0) | |
358 | ||
f35822af | 359 | |
8ec2b484 HH |
360 | bool wxHtmlHelpData::LoadCachedBook(wxHtmlBookRecord *book, wxInputStream *f) |
361 | { | |
91fa114d | 362 | int i, st, newsize; |
f35822af VS |
363 | wxInt32 version; |
364 | ||
365 | /* load header - version info : */ | |
4fd5055c | 366 | version = CacheReadInt32(f); |
d1da8872 | 367 | |
04dbb646 | 368 | if (version != CURRENT_CACHED_BOOK_VERSION) |
f3c82859 | 369 | { |
d1da8872 | 370 | // NB: We can just silently return false here and don't worry about |
4fd5055c | 371 | // it anymore, because AddBookParam will load the MS project in |
d1da8872 | 372 | // absence of (properly versioned) .cached file and automatically |
4fd5055c | 373 | // create new .cached file immediately afterward. |
91fa114d | 374 | return false; |
f3c82859 | 375 | } |
04dbb646 | 376 | |
d1a9c82b | 377 | if (CacheReadInt32(f) != CACHED_BOOK_FORMAT_FLAGS) |
91fa114d | 378 | return false; |
d1a9c82b | 379 | |
8ec2b484 | 380 | /* load contents : */ |
91fa114d VS |
381 | st = m_contents.size(); |
382 | newsize = st + CacheReadInt32(f); | |
383 | m_contents.Alloc(newsize); | |
384 | for (i = st; i < newsize; i++) | |
4f9297b0 | 385 | { |
91fa114d VS |
386 | wxHtmlHelpDataItem *item = new wxHtmlHelpDataItem; |
387 | item->level = CacheReadInt32(f); | |
388 | item->id = CacheReadInt32(f); | |
389 | item->name = CacheReadString(f); | |
390 | item->page = CacheReadString(f); | |
391 | item->book = book; | |
392 | m_contents.Add(item); | |
8ec2b484 HH |
393 | } |
394 | ||
395 | /* load index : */ | |
91fa114d VS |
396 | st = m_index.size(); |
397 | newsize = st + CacheReadInt32(f); | |
398 | m_index.Alloc(newsize); | |
399 | for (i = st; i < newsize; i++) | |
4f9297b0 | 400 | { |
91fa114d VS |
401 | wxHtmlHelpDataItem *item = new wxHtmlHelpDataItem; |
402 | item->name = CacheReadString(f); | |
403 | item->page = CacheReadString(f); | |
404 | item->level = CacheReadInt32(f); | |
405 | item->book = book; | |
406 | int parentShift = CacheReadInt32(f); | |
407 | if (parentShift != 0) | |
408 | item->parent = &m_index[m_index.size() - parentShift]; | |
409 | m_index.Add(item); | |
8ec2b484 | 410 | } |
91fa114d | 411 | return true; |
8ec2b484 HH |
412 | } |
413 | ||
414 | ||
415 | bool wxHtmlHelpData::SaveCachedBook(wxHtmlBookRecord *book, wxOutputStream *f) | |
416 | { | |
417 | int i; | |
4fd5055c | 418 | wxInt32 cnt; |
f35822af VS |
419 | |
420 | /* save header - version info : */ | |
4fd5055c | 421 | CacheWriteInt32(f, CURRENT_CACHED_BOOK_VERSION); |
d1a9c82b | 422 | CacheWriteInt32(f, CACHED_BOOK_FORMAT_FLAGS); |
8ec2b484 HH |
423 | |
424 | /* save contents : */ | |
91fa114d | 425 | int len = m_contents.size(); |
d1da8872 | 426 | for (cnt = 0, i = 0; i < len; i++) |
91fa114d | 427 | if (m_contents[i].book == book && m_contents[i].level > 0) |
4fd5055c VS |
428 | cnt++; |
429 | CacheWriteInt32(f, cnt); | |
8ec2b484 | 430 | |
91fa114d | 431 | for (i = 0; i < len; i++) |
4f9297b0 | 432 | { |
d1da8872 | 433 | if (m_contents[i].book != book || m_contents[i].level == 0) |
4fd5055c | 434 | continue; |
91fa114d VS |
435 | CacheWriteInt32(f, m_contents[i].level); |
436 | CacheWriteInt32(f, m_contents[i].id); | |
437 | CacheWriteString(f, m_contents[i].name); | |
438 | CacheWriteString(f, m_contents[i].page); | |
8ec2b484 HH |
439 | } |
440 | ||
441 | /* save index : */ | |
91fa114d | 442 | len = m_index.size(); |
d1da8872 WS |
443 | for (cnt = 0, i = 0; i < len; i++) |
444 | if (m_index[i].book == book && m_index[i].level > 0) | |
4fd5055c VS |
445 | cnt++; |
446 | CacheWriteInt32(f, cnt); | |
8ec2b484 | 447 | |
91fa114d | 448 | for (i = 0; i < len; i++) |
4f9297b0 | 449 | { |
d1da8872 | 450 | if (m_index[i].book != book || m_index[i].level == 0) |
4fd5055c | 451 | continue; |
91fa114d VS |
452 | CacheWriteString(f, m_index[i].name); |
453 | CacheWriteString(f, m_index[i].page); | |
454 | CacheWriteInt32(f, m_index[i].level); | |
455 | // save distance to parent item, if any: | |
456 | if (m_index[i].parent == NULL) | |
457 | { | |
458 | CacheWriteInt32(f, 0); | |
459 | } | |
460 | else | |
461 | { | |
17a1ebd1 | 462 | int cnt2 = 0; |
91fa114d VS |
463 | wxHtmlHelpDataItem *parent = m_index[i].parent; |
464 | for (int j = i-1; j >= 0; j--) | |
465 | { | |
466 | if (m_index[j].book == book && m_index[j].level > 0) | |
17a1ebd1 | 467 | cnt2++; |
91fa114d VS |
468 | if (&m_index[j] == parent) |
469 | break; | |
470 | } | |
17a1ebd1 VZ |
471 | wxASSERT(cnt2 > 0); |
472 | CacheWriteInt32(f, cnt2); | |
91fa114d | 473 | } |
8ec2b484 | 474 | } |
91fa114d | 475 | return true; |
8ec2b484 HH |
476 | } |
477 | ||
478 | ||
479 | void wxHtmlHelpData::SetTempDir(const wxString& path) | |
480 | { | |
91fa114d VS |
481 | if (path.empty()) |
482 | m_tempPath = path; | |
04dbb646 | 483 | else |
4f9297b0 | 484 | { |
91fa114d VS |
485 | if (wxIsAbsolutePath(path)) m_tempPath = path; |
486 | else m_tempPath = wxGetCwd() + _T("/") + path; | |
8ec2b484 | 487 | |
93763ad5 | 488 | if (m_tempPath[m_tempPath.length() - 1] != _T('/')) |
91fa114d | 489 | m_tempPath << _T('/'); |
8ec2b484 HH |
490 | } |
491 | } | |
492 | ||
493 | ||
29e60597 VS |
494 | |
495 | static wxString SafeFileName(const wxString& s) | |
496 | { | |
497 | wxString res(s); | |
498 | res.Replace(wxT("#"), wxT("_")); | |
499 | res.Replace(wxT(":"), wxT("_")); | |
500 | res.Replace(wxT("\\"), wxT("_")); | |
501 | res.Replace(wxT("/"), wxT("_")); | |
502 | return res; | |
503 | } | |
504 | ||
f35822af | 505 | bool wxHtmlHelpData::AddBookParam(const wxFSFile& bookfile, |
f890e2d4 | 506 | wxFontEncoding encoding, |
f35822af | 507 | const wxString& title, const wxString& contfile, |
d5bb85a0 VS |
508 | const wxString& indexfile, const wxString& deftopic, |
509 | const wxString& path) | |
8ec2b484 HH |
510 | { |
511 | wxFileSystem fsys; | |
512 | wxFSFile *fi; | |
513 | wxHtmlBookRecord *bookr; | |
04dbb646 | 514 | |
91fa114d VS |
515 | int IndexOld = m_index.size(), |
516 | ContentsOld = m_contents.size(); | |
f42b1601 | 517 | |
93763ad5 | 518 | if (!path.empty()) |
d1da8872 | 519 | fsys.ChangePathTo(path, true); |
8ec2b484 | 520 | |
91fa114d | 521 | size_t booksCnt = m_bookRecords.GetCount(); |
5ecdcaa7 VS |
522 | for (size_t i = 0; i < booksCnt; i++) |
523 | { | |
91fa114d VS |
524 | if ( m_bookRecords[i].GetBookFile() == bookfile.GetLocation() ) |
525 | return true; // book is (was) loaded | |
5ecdcaa7 VS |
526 | } |
527 | ||
528 | bookr = new wxHtmlBookRecord(bookfile.GetLocation(), fsys.GetPath(), title, deftopic); | |
d1da8872 | 529 | |
91fa114d VS |
530 | wxHtmlHelpDataItem *bookitem = new wxHtmlHelpDataItem; |
531 | bookitem->level = 0; | |
532 | bookitem->id = 0; | |
533 | bookitem->page = deftopic; | |
534 | bookitem->name = title; | |
535 | bookitem->book = bookr; | |
8ec2b484 HH |
536 | |
537 | // store the contents index for later | |
91fa114d VS |
538 | int cont_start = m_contents.size(); |
539 | ||
540 | m_contents.Add(bookitem); | |
8ec2b484 HH |
541 | |
542 | // Try to find cached binary versions: | |
f35822af VS |
543 | // 1. save file as book, but with .hhp.cached extension |
544 | // 2. same as 1. but in temp path | |
545 | // 3. otherwise or if cache load failed, load it from MS. | |
04dbb646 | 546 | |
f35822af | 547 | fi = fsys.OpenFile(bookfile.GetLocation() + wxT(".cached")); |
04dbb646 VZ |
548 | |
549 | if (fi == NULL || | |
e2b87f38 | 550 | #if wxUSE_DATETIME |
04dbb646 | 551 | fi->GetModificationTime() < bookfile.GetModificationTime() || |
e2b87f38 | 552 | #endif // wxUSE_DATETIME |
4f9297b0 | 553 | !LoadCachedBook(bookr, fi->GetStream())) |
f35822af VS |
554 | { |
555 | if (fi != NULL) delete fi; | |
91fa114d VS |
556 | fi = fsys.OpenFile(m_tempPath + wxFileNameFromPath(bookfile.GetLocation()) + wxT(".cached")); |
557 | if (m_tempPath.empty() || fi == NULL || | |
e2b87f38 | 558 | #if wxUSE_DATETIME |
04dbb646 | 559 | fi->GetModificationTime() < bookfile.GetModificationTime() || |
e2b87f38 | 560 | #endif // wxUSE_DATETIME |
4f9297b0 | 561 | !LoadCachedBook(bookr, fi->GetStream())) |
f35822af VS |
562 | { |
563 | LoadMSProject(bookr, fsys, indexfile, contfile); | |
91fa114d | 564 | if (!m_tempPath.empty()) |
f35822af | 565 | { |
91fa114d | 566 | wxFileOutputStream *outs = new wxFileOutputStream(m_tempPath + |
29e60597 | 567 | SafeFileName(wxFileNameFromPath(bookfile.GetLocation())) + wxT(".cached")); |
f35822af VS |
568 | SaveCachedBook(bookr, outs); |
569 | delete outs; | |
570 | } | |
d5bb85a0 | 571 | } |
8ec2b484 | 572 | } |
04dbb646 | 573 | |
f35822af | 574 | if (fi != NULL) delete fi; |
8ec2b484 HH |
575 | |
576 | // Now store the contents range | |
91fa114d | 577 | bookr->SetContentsRange(cont_start, m_contents.size()); |
04dbb646 | 578 | |
3912b3f8 VS |
579 | #if wxUSE_WCHAR_T |
580 | // MS HTML Help files [written by MS HTML Help Workshop] are broken | |
581 | // in that the data are iso-8859-1 (including HTML entities), but must | |
582 | // be interpreted as being in language's windows charset. Correct the | |
583 | // differences here and also convert to wxConvLocal in ANSI build | |
67c276bd | 584 | if (encoding != wxFONTENCODING_SYSTEM) |
3912b3f8 VS |
585 | { |
586 | #if wxUSE_UNICODE | |
587 | #define CORRECT_STR(str, conv) \ | |
588 | str = wxString((str).mb_str(wxConvISO8859_1), conv) | |
589 | #else | |
590 | #define CORRECT_STR(str, conv) \ | |
591 | str = wxString((str).wc_str(conv), wxConvLocal) | |
592 | #endif | |
67c276bd | 593 | wxCSConv conv(encoding); |
91fa114d VS |
594 | size_t IndexCnt = m_index.size(); |
595 | size_t ContentsCnt = m_contents.size(); | |
596 | size_t i; | |
597 | for (i = IndexOld; i < IndexCnt; i++) | |
f890e2d4 | 598 | { |
91fa114d | 599 | CORRECT_STR(m_index[i].name, conv); |
f890e2d4 | 600 | } |
91fa114d | 601 | for (i = ContentsOld; i < ContentsCnt; i++) |
3912b3f8 | 602 | { |
91fa114d | 603 | CORRECT_STR(m_contents[i].name, conv); |
3912b3f8 VS |
604 | } |
605 | #undef CORRECT_STR | |
f890e2d4 | 606 | } |
0b4f47a3 DS |
607 | #else |
608 | wxUnusedVar(IndexOld); | |
609 | wxUnusedVar(ContentsOld); | |
67c276bd | 610 | wxASSERT_MSG(encoding == wxFONTENCODING_SYSTEM, wxT("Help files need charset conversion, but wxUSE_WCHAR_T is 0")); |
3912b3f8 | 611 | #endif // wxUSE_WCHAR_T/!wxUSE_WCHAR_T |
8ec2b484 | 612 | |
91fa114d VS |
613 | m_bookRecords.Add(bookr); |
614 | if (!m_index.empty()) | |
615 | { | |
616 | m_index.Sort(wxHtmlHelpIndexCompareFunc); | |
617 | } | |
f42b1601 | 618 | |
91fa114d | 619 | return true; |
8ec2b484 HH |
620 | } |
621 | ||
622 | ||
623 | bool wxHtmlHelpData::AddBook(const wxString& book) | |
624 | { | |
3527f29c VS |
625 | wxString extension(book.Right(4).Lower()); |
626 | if (extension == wxT(".zip") || | |
627 | #if wxUSE_LIBMSPACK | |
628 | extension == wxT(".chm") /*compressed html help book*/ || | |
629 | #endif | |
630 | extension == wxT(".htb") /*html book*/) | |
68364659 VS |
631 | { |
632 | wxFileSystem fsys; | |
633 | wxString s; | |
d1da8872 | 634 | bool rt = false; |
68364659 | 635 | |
3527f29c VS |
636 | #if wxUSE_LIBMSPACK |
637 | if (extension == wxT(".chm")) | |
638 | s = fsys.FindFirst(book + wxT("#chm:*.hhp"), wxFILE); | |
639 | else | |
640 | #endif | |
641 | s = fsys.FindFirst(book + wxT("#zip:*.hhp"), wxFILE); | |
642 | ||
93763ad5 | 643 | while (!s.empty()) |
68364659 | 644 | { |
d1da8872 | 645 | if (AddBook(s)) rt = true; |
68364659 VS |
646 | s = fsys.FindNext(); |
647 | } | |
04dbb646 | 648 | |
68364659 VS |
649 | return rt; |
650 | } | |
68364659 | 651 | |
a509f830 VZ |
652 | wxFSFile *fi; |
653 | wxFileSystem fsys; | |
3dde6c72 | 654 | |
a509f830 VZ |
655 | wxString title = _("noname"), |
656 | safetitle, | |
657 | start = wxEmptyString, | |
658 | contents = wxEmptyString, | |
659 | index = wxEmptyString, | |
660 | charset = wxEmptyString; | |
68364659 | 661 | |
a509f830 VZ |
662 | fi = fsys.OpenFile(book); |
663 | if (fi == NULL) | |
664 | { | |
665 | wxLogError(_("Cannot open HTML help book: %s"), book.c_str()); | |
d1da8872 | 666 | return false; |
68364659 | 667 | } |
a509f830 VZ |
668 | fsys.ChangePathTo(book); |
669 | ||
670 | const wxChar *lineptr; | |
671 | wxChar linebuf[300]; | |
672 | wxString tmp; | |
673 | wxHtmlFilterPlainText filter; | |
674 | tmp = filter.ReadFile(*fi); | |
675 | lineptr = tmp.c_str(); | |
676 | ||
d1da8872 | 677 | do |
a509f830 VZ |
678 | { |
679 | lineptr = ReadLine(lineptr, linebuf, 300); | |
d1da8872 | 680 | |
a509f830 | 681 | for (wxChar *ch = linebuf; *ch != wxT('\0') && *ch != wxT('='); ch++) |
42841dfc | 682 | *ch = (wxChar)wxTolower(*ch); |
a509f830 VZ |
683 | |
684 | if (wxStrstr(linebuf, _T("title=")) == linebuf) | |
685 | title = linebuf + wxStrlen(_T("title=")); | |
686 | if (wxStrstr(linebuf, _T("default topic=")) == linebuf) | |
687 | start = linebuf + wxStrlen(_T("default topic=")); | |
688 | if (wxStrstr(linebuf, _T("index file=")) == linebuf) | |
689 | index = linebuf + wxStrlen(_T("index file=")); | |
690 | if (wxStrstr(linebuf, _T("contents file=")) == linebuf) | |
691 | contents = linebuf + wxStrlen(_T("contents file=")); | |
692 | if (wxStrstr(linebuf, _T("charset=")) == linebuf) | |
693 | charset = linebuf + wxStrlen(_T("charset=")); | |
694 | } while (lineptr != NULL); | |
d1da8872 | 695 | |
5a969262 RR |
696 | wxFontEncoding enc = wxFONTENCODING_SYSTEM; |
697 | #if wxUSE_FONTMAP | |
698 | if (charset != wxEmptyString) | |
699 | enc = wxFontMapper::Get()->CharsetToEncoding(charset); | |
700 | #endif | |
a509f830 | 701 | |
67c276bd | 702 | bool rtval = AddBookParam(*fi, enc, |
a509f830 VZ |
703 | title, contents, index, start, fsys.GetPath()); |
704 | delete fi; | |
91fa114d VS |
705 | |
706 | #if WXWIN_COMPATIBILITY_2_4 | |
707 | CleanCompatibilityData(); | |
708 | #endif | |
709 | ||
a509f830 | 710 | return rtval; |
8ec2b484 HH |
711 | } |
712 | ||
713 | wxString wxHtmlHelpData::FindPageByName(const wxString& x) | |
714 | { | |
715 | int cnt; | |
716 | int i; | |
717 | wxFileSystem fsys; | |
718 | wxFSFile *f; | |
8ec2b484 | 719 | |
735a74df | 720 | // 1. try to open given file: |
91fa114d | 721 | cnt = m_bookRecords.GetCount(); |
04dbb646 | 722 | for (i = 0; i < cnt; i++) |
4f9297b0 | 723 | { |
91fa114d | 724 | f = fsys.OpenFile(m_bookRecords[i].GetFullPath(x)); |
04dbb646 VZ |
725 | if (f) |
726 | { | |
91fa114d | 727 | wxString url = m_bookRecords[i].GetFullPath(x); |
8ec2b484 HH |
728 | delete f; |
729 | return url; | |
730 | } | |
731 | } | |
732 | ||
733 | ||
735a74df | 734 | // 2. try to find a book: |
04dbb646 | 735 | for (i = 0; i < cnt; i++) |
4f9297b0 | 736 | { |
91fa114d VS |
737 | if (m_bookRecords[i].GetTitle() == x) |
738 | return m_bookRecords[i].GetFullPath(m_bookRecords[i].GetStart()); | |
8ec2b484 HH |
739 | } |
740 | ||
735a74df | 741 | // 3. try to find in contents: |
91fa114d | 742 | cnt = m_contents.size(); |
04dbb646 | 743 | for (i = 0; i < cnt; i++) |
4f9297b0 | 744 | { |
91fa114d VS |
745 | if (m_contents[i].name == x) |
746 | return m_contents[i].GetFullPath(); | |
8ec2b484 HH |
747 | } |
748 | ||
749 | ||
735a74df | 750 | // 4. try to find in index: |
91fa114d | 751 | cnt = m_index.size(); |
04dbb646 | 752 | for (i = 0; i < cnt; i++) |
4f9297b0 | 753 | { |
91fa114d VS |
754 | if (m_index[i].name == x) |
755 | return m_index[i].GetFullPath(); | |
8ec2b484 HH |
756 | } |
757 | ||
735a74df VZ |
758 | // 4b. if still not found, try case-insensitive comparison |
759 | for (i = 0; i < cnt; i++) | |
760 | { | |
761 | if (m_index[i].name.CmpNoCase(x) == 0) | |
762 | return m_index[i].GetFullPath(); | |
763 | } | |
764 | ||
91fa114d | 765 | return wxEmptyString; |
8ec2b484 HH |
766 | } |
767 | ||
768 | wxString wxHtmlHelpData::FindPageById(int id) | |
f42b1601 | 769 | { |
91fa114d VS |
770 | size_t cnt = m_contents.size(); |
771 | for (size_t i = 0; i < cnt; i++) | |
4f9297b0 | 772 | { |
91fa114d | 773 | if (m_contents[i].id == id) |
04dbb646 | 774 | { |
91fa114d | 775 | return m_contents[i].GetFullPath(); |
8ec2b484 HH |
776 | } |
777 | } | |
778 | ||
91fa114d VS |
779 | return wxEmptyString; |
780 | } | |
781 | ||
782 | #if WXWIN_COMPATIBILITY_2_4 | |
783 | wxHtmlContentsItem::wxHtmlContentsItem() | |
d1da8872 | 784 | : m_Level(0), m_ID(wxID_ANY), m_Name(NULL), m_Page(NULL), m_Book(NULL), |
91fa114d VS |
785 | m_autofree(false) |
786 | { | |
787 | } | |
788 | ||
789 | wxHtmlContentsItem::wxHtmlContentsItem(const wxHtmlHelpDataItem& d) | |
790 | { | |
791 | m_autofree = true; | |
792 | m_Level = d.level; | |
793 | m_ID = d.id; | |
794 | m_Name = wxStrdup(d.name.c_str()); | |
795 | m_Page = wxStrdup(d.page.c_str()); | |
796 | m_Book = d.book; | |
797 | } | |
798 | ||
799 | wxHtmlContentsItem& wxHtmlContentsItem::operator=(const wxHtmlContentsItem& d) | |
800 | { | |
801 | if (m_autofree) | |
802 | { | |
803 | free(m_Name); | |
804 | free(m_Page); | |
805 | } | |
806 | m_autofree = true; | |
807 | m_Level = d.m_Level; | |
808 | m_ID = d.m_ID; | |
809 | m_Name = d.m_Name ? wxStrdup(d.m_Name) : NULL; | |
810 | m_Page = d.m_Page ? wxStrdup(d.m_Page) : NULL; | |
811 | m_Book = d.m_Book; | |
812 | return *this; | |
8ec2b484 HH |
813 | } |
814 | ||
91fa114d VS |
815 | wxHtmlContentsItem::~wxHtmlContentsItem() |
816 | { | |
817 | if (m_autofree) | |
818 | { | |
819 | free(m_Name); | |
820 | free(m_Page); | |
821 | } | |
822 | } | |
823 | ||
824 | wxHtmlContentsItem* wxHtmlHelpData::GetContents() | |
825 | { | |
826 | if (!m_cacheContents && !m_contents.empty()) | |
827 | { | |
828 | size_t len = m_contents.size(); | |
829 | m_cacheContents = new wxHtmlContentsItem[len]; | |
830 | for (size_t i = 0; i < len; i++) | |
831 | m_cacheContents[i] = m_contents[i]; | |
832 | } | |
833 | return m_cacheContents; | |
834 | } | |
835 | ||
836 | int wxHtmlHelpData::GetContentsCnt() | |
837 | { | |
838 | return m_contents.size(); | |
839 | } | |
840 | ||
841 | wxHtmlContentsItem* wxHtmlHelpData::GetIndex() | |
842 | { | |
843 | if (!m_cacheContents && !m_index.empty()) | |
844 | { | |
845 | size_t len = m_index.size(); | |
846 | m_cacheContents = new wxHtmlContentsItem[len]; | |
847 | for (size_t i = 0; i < len; i++) | |
848 | m_cacheContents[i] = m_index[i]; | |
849 | } | |
850 | return m_cacheContents; | |
851 | } | |
852 | ||
853 | int wxHtmlHelpData::GetIndexCnt() | |
854 | { | |
855 | return m_index.size(); | |
856 | } | |
857 | ||
858 | void wxHtmlHelpData::CleanCompatibilityData() | |
859 | { | |
860 | delete[] m_cacheContents; | |
861 | m_cacheContents = NULL; | |
862 | delete[] m_cacheIndex; | |
863 | m_cacheIndex = NULL; | |
864 | } | |
865 | #endif // WXWIN_COMPATIBILITY_2_4 | |
866 | ||
8ec2b484 HH |
867 | //---------------------------------------------------------------------------------- |
868 | // wxHtmlSearchStatus functions | |
869 | //---------------------------------------------------------------------------------- | |
870 | ||
871 | wxHtmlSearchStatus::wxHtmlSearchStatus(wxHtmlHelpData* data, const wxString& keyword, | |
c4971147 | 872 | bool case_sensitive, bool whole_words_only, |
d5bb85a0 | 873 | const wxString& book) |
8ec2b484 HH |
874 | { |
875 | m_Data = data; | |
876 | m_Keyword = keyword; | |
877 | wxHtmlBookRecord* bookr = NULL; | |
04dbb646 | 878 | if (book != wxEmptyString) |
4f9297b0 | 879 | { |
d5bb85a0 | 880 | // we have to search in a specific book. Find it first |
91fa114d | 881 | int i, cnt = data->m_bookRecords.GetCount(); |
d5bb85a0 | 882 | for (i = 0; i < cnt; i++) |
91fa114d | 883 | if (data->m_bookRecords[i].GetTitle() == book) |
04dbb646 | 884 | { |
91fa114d | 885 | bookr = &(data->m_bookRecords[i]); |
d5bb85a0 VS |
886 | m_CurIndex = bookr->GetContentsStart(); |
887 | m_MaxIndex = bookr->GetContentsEnd(); | |
888 | break; | |
889 | } | |
890 | // check; we won't crash if the book doesn't exist, but it's Bad Anyway. | |
891 | wxASSERT(bookr); | |
8ec2b484 | 892 | } |
04dbb646 | 893 | if (! bookr) |
4f9297b0 | 894 | { |
d5bb85a0 VS |
895 | // no book specified; search all books |
896 | m_CurIndex = 0; | |
91fa114d | 897 | m_MaxIndex = m_Data->m_contents.size(); |
8ec2b484 | 898 | } |
c4971147 | 899 | m_Engine.LookFor(keyword, case_sensitive, whole_words_only); |
8ec2b484 | 900 | m_Active = (m_CurIndex < m_MaxIndex); |
8ec2b484 HH |
901 | } |
902 | ||
91fa114d VS |
903 | #if WXWIN_COMPATIBILITY_2_4 |
904 | wxHtmlContentsItem* wxHtmlSearchStatus::GetContentsItem() | |
905 | { | |
906 | static wxHtmlContentsItem it; | |
907 | it = wxHtmlContentsItem(*m_CurItem); | |
908 | return ⁢ | |
909 | } | |
910 | #endif | |
911 | ||
8ec2b484 HH |
912 | bool wxHtmlSearchStatus::Search() |
913 | { | |
8ec2b484 | 914 | wxFSFile *file; |
d5bb85a0 | 915 | int i = m_CurIndex; // shortcut |
91fa114d | 916 | bool found = false; |
3912b3f8 | 917 | wxString thepage; |
8ec2b484 | 918 | |
04dbb646 | 919 | if (!m_Active) |
4f9297b0 | 920 | { |
f35822af | 921 | // sanity check. Illegal use, but we'll try to prevent a crash anyway |
50494a55 | 922 | wxASSERT(m_Active); |
91fa114d | 923 | return false; |
8ec2b484 HH |
924 | } |
925 | ||
8ec2b484 | 926 | m_Name = wxEmptyString; |
91fa114d VS |
927 | m_CurItem = NULL; |
928 | thepage = m_Data->m_contents[i].page; | |
8ec2b484 | 929 | |
b5a7b000 VS |
930 | m_Active = (++m_CurIndex < m_MaxIndex); |
931 | // check if it is same page with different anchor: | |
3912b3f8 | 932 | if (!m_LastPage.empty()) |
b5a7b000 | 933 | { |
3912b3f8 VS |
934 | const wxChar *p1, *p2; |
935 | for (p1 = thepage.c_str(), p2 = m_LastPage.c_str(); | |
b5a7b000 VS |
936 | *p1 != 0 && *p1 != _T('#') && *p1 == *p2; p1++, p2++) {} |
937 | ||
938 | m_LastPage = thepage; | |
939 | ||
940 | if (*p1 == 0 || *p1 == _T('#')) | |
3912b3f8 | 941 | return false; |
b5a7b000 VS |
942 | } |
943 | else m_LastPage = thepage; | |
04dbb646 | 944 | |
f35822af | 945 | wxFileSystem fsys; |
91fa114d | 946 | file = fsys.OpenFile(m_Data->m_contents[i].book->GetFullPath(thepage)); |
04dbb646 | 947 | if (file) |
b5a7b000 | 948 | { |
2b5f62a0 | 949 | if (m_Engine.Scan(*file)) |
468ae730 | 950 | { |
91fa114d VS |
951 | m_Name = m_Data->m_contents[i].name; |
952 | m_CurItem = &m_Data->m_contents[i]; | |
953 | found = true; | |
d5bb85a0 VS |
954 | } |
955 | delete file; | |
8ec2b484 | 956 | } |
8ec2b484 HH |
957 | return found; |
958 | } | |
959 | ||
d5bb85a0 VS |
960 | |
961 | ||
962 | ||
963 | ||
964 | ||
965 | ||
966 | ||
967 | //-------------------------------------------------------------------------------- | |
2b5f62a0 | 968 | // wxHtmlSearchEngine |
d5bb85a0 VS |
969 | //-------------------------------------------------------------------------------- |
970 | ||
2b5f62a0 | 971 | void wxHtmlSearchEngine::LookFor(const wxString& keyword, bool case_sensitive, bool whole_words_only) |
d5bb85a0 | 972 | { |
c4971147 VS |
973 | m_CaseSensitive = case_sensitive; |
974 | m_WholeWords = whole_words_only; | |
3912b3f8 | 975 | m_Keyword = keyword; |
04dbb646 | 976 | |
3444e4a8 | 977 | if (!m_CaseSensitive) |
3912b3f8 | 978 | m_Keyword.LowerCase(); |
d5bb85a0 VS |
979 | } |
980 | ||
981 | ||
1a1dac18 MB |
982 | static inline bool WHITESPACE(wxChar c) |
983 | { | |
984 | return c == _T(' ') || c == _T('\n') || c == _T('\r') || c == _T('\t'); | |
985 | } | |
c4971147 | 986 | |
21dc4638 VZ |
987 | // replace continuous spaces by one single space |
988 | static inline wxString CompressSpaces(const wxString & str) | |
989 | { | |
990 | wxString buf; | |
991 | buf.reserve( str.size() ); | |
992 | ||
993 | bool space_counted = false; | |
994 | for( const wxChar * pstr = str.c_str(); *pstr; ++pstr ) | |
995 | { | |
996 | wxChar ch = *pstr; | |
997 | if( WHITESPACE( ch ) ) | |
998 | { | |
999 | if( space_counted ) | |
1000 | { | |
1001 | continue; | |
1002 | } | |
1003 | ch = _T(' '); | |
1004 | space_counted = true; | |
1005 | } | |
1006 | else | |
1007 | { | |
1008 | space_counted = false; | |
1009 | } | |
1010 | buf += ch; | |
1011 | } | |
1012 | ||
1013 | return buf; | |
1014 | } | |
1015 | ||
2b5f62a0 | 1016 | bool wxHtmlSearchEngine::Scan(const wxFSFile& file) |
d5bb85a0 | 1017 | { |
3912b3f8 | 1018 | wxASSERT_MSG(!m_Keyword.empty(), wxT("wxHtmlSearchEngine::LookFor must be called before scanning!")); |
d5bb85a0 | 1019 | |
2b5f62a0 | 1020 | wxHtmlFilterHTML filter; |
21dc4638 | 1021 | wxString bufStr = filter.ReadFile(file); |
d5bb85a0 | 1022 | |
c4971147 | 1023 | if (!m_CaseSensitive) |
21dc4638 | 1024 | bufStr.LowerCase(); |
d5bb85a0 | 1025 | |
21dc4638 VZ |
1026 | { // remove html tags |
1027 | wxString bufStrCopy; | |
1028 | bufStrCopy.reserve( bufStr.size() ); | |
1029 | bool insideTag = false; | |
1030 | for (const wxChar * pBufStr = bufStr.c_str(); *pBufStr; ++pBufStr) | |
04dbb646 | 1031 | { |
21dc4638 VZ |
1032 | wxChar c = *pBufStr; |
1033 | if (insideTag) | |
1034 | { | |
1035 | if (c == _T('>')) | |
1036 | { | |
1037 | insideTag = false; | |
1038 | // replace the tag by an empty space | |
1039 | c = _T(' '); | |
1040 | } | |
1041 | else | |
1042 | continue; | |
1043 | } | |
1044 | else if (c == _T('<')) | |
1045 | { | |
1046 | wxChar nextCh = *(pBufStr + 1); | |
1047 | if (nextCh == _T('/') || !WHITESPACE(nextCh)) | |
1048 | { | |
1049 | insideTag = true; | |
1050 | continue; | |
1051 | } | |
1052 | } | |
1053 | bufStrCopy += c; | |
c4971147 | 1054 | } |
21dc4638 | 1055 | bufStr.swap( bufStrCopy ); |
c4971147 | 1056 | } |
04dbb646 | 1057 | |
21dc4638 VZ |
1058 | wxString keyword = m_Keyword; |
1059 | ||
1060 | if (m_WholeWords) | |
c4971147 | 1061 | { |
21dc4638 VZ |
1062 | // insert ' ' at the beginning and at the end |
1063 | keyword.insert( 0, _T(" ") ); | |
1064 | keyword.append( _T(" ") ); | |
1065 | bufStr.insert( 0, _T(" ") ); | |
1066 | bufStr.append( _T(" ") ); | |
d5bb85a0 VS |
1067 | } |
1068 | ||
21dc4638 VZ |
1069 | // remove continuous spaces |
1070 | keyword = CompressSpaces( keyword ); | |
1071 | bufStr = CompressSpaces( bufStr ); | |
d5bb85a0 | 1072 | |
21dc4638 VZ |
1073 | // finally do the search |
1074 | return bufStr.find( keyword ) != wxString::npos; | |
1075 | } | |
d5bb85a0 | 1076 | |
8ec2b484 | 1077 | #endif |