]> git.saurik.com Git - wxWidgets.git/blame - src/html/helpdata.cpp
Add wxHtmlTag::GetParamAsString() convenience method.
[wxWidgets.git] / src / html / helpdata.cpp
CommitLineData
8ec2b484 1/////////////////////////////////////////////////////////////////////////////
93763ad5 2// Name: src/html/helpdata.cpp
8ec2b484 3// Purpose: wxHtmlHelpData
f42b1601 4// Notes: Based on htmlhelp.cpp, implementing a monolithic
8ec2b484
HH
5// HTML Help controller class, by Vaclav Slavik
6// Author: Harm van der Heijden and Vaclav Slavik
8ec2b484 7// Copyright: (c) Harm van der Heijden and Vaclav Slavik
65571936 8// Licence: wxWindows licence
8ec2b484
HH
9/////////////////////////////////////////////////////////////////////////////
10
8ec2b484
HH
11// For compilers that support precompilation, includes "wx.h".
12#include "wx/wxprec.h"
13
14#ifdef __BORLANDC__
93763ad5 15 #pragma hdrstop
8ec2b484
HH
16#endif
17
f6bcfd97 18#if wxUSE_HTML && wxUSE_STREAMS
8ec2b484 19
b4f4d3dd 20#ifndef WX_PRECOMP
04dbb646
VZ
21 #include "wx/intl.h"
22 #include "wx/log.h"
8ec2b484
HH
23#endif
24
401eb3de
RR
25#include <ctype.h>
26
8ec2b484
HH
27#include "wx/html/helpdata.h"
28#include "wx/tokenzr.h"
29#include "wx/wfstream.h"
30#include "wx/busyinfo.h"
f890e2d4
VS
31#include "wx/encconv.h"
32#include "wx/fontmap.h"
69941f05 33#include "wx/html/htmlpars.h"
8ec2b484 34#include "wx/html/htmldefs.h"
2b5f62a0 35#include "wx/html/htmlfilt.h"
057b55b0 36#include "wx/filename.h"
8ec2b484
HH
37
38#include "wx/arrimpl.cpp"
39WX_DEFINE_OBJARRAY(wxHtmlBookRecArray)
91fa114d 40WX_DEFINE_OBJARRAY(wxHtmlHelpDataItems)
8ec2b484
HH
41
42//-----------------------------------------------------------------------------
43// static helper functions
44//-----------------------------------------------------------------------------
45
46// Reads one line, stores it into buf and returns pointer to new line or NULL.
1a1dac18 47static const wxChar* ReadLine(const wxChar *line, wxChar *buf, size_t bufsize)
8ec2b484 48{
1a1dac18
MB
49 wxChar *writeptr = buf;
50 wxChar *endptr = buf + bufsize - 1;
51 const wxChar *readptr = line;
8ec2b484 52
9a83f860 53 while (*readptr != 0 && *readptr != wxT('\r') && *readptr != wxT('\n') &&
d1da8872 54 writeptr != endptr)
3dde6c72 55 *(writeptr++) = *(readptr++);
8ec2b484 56 *writeptr = 0;
9a83f860 57 while (*readptr == wxT('\r') || *readptr == wxT('\n'))
3dde6c72
VS
58 readptr++;
59 if (*readptr == 0)
60 return NULL;
d1da8872 61 else
3dde6c72 62 return readptr;
8ec2b484
HH
63}
64
65
8ec2b484 66
91fa114d
VS
67static int
68wxHtmlHelpIndexCompareFunc(wxHtmlHelpDataItem **a, wxHtmlHelpDataItem **b)
8ec2b484 69{
91fa114d
VS
70 wxHtmlHelpDataItem *ia = *a;
71 wxHtmlHelpDataItem *ib = *b;
3912b3f8 72
7fbe5489
VS
73 if (ia == NULL)
74 return -1;
75 if (ib == NULL)
76 return 1;
42841dfc 77
91fa114d
VS
78 if (ia->parent == ib->parent)
79 {
80 return ia->name.CmpNoCase(ib->name);
81 }
82 else if (ia->level == ib->level)
83 {
84 return wxHtmlHelpIndexCompareFunc(&ia->parent, &ib->parent);
85 }
86 else
87 {
88 wxHtmlHelpDataItem *ia2 = ia;
89 wxHtmlHelpDataItem *ib2 = ib;
d1da8872 90
91fa114d
VS
91 while (ia2->level > ib2->level)
92 {
93 ia2 = ia2->parent;
94 }
95 while (ib2->level > ia2->level)
96 {
97 ib2 = ib2->parent;
98 }
d1da8872 99
91fa114d
VS
100 wxASSERT(ia2);
101 wxASSERT(ib2);
102 int res = wxHtmlHelpIndexCompareFunc(&ia2, &ib2);
103 if (res != 0)
104 return res;
105 else if (ia->level > ib->level)
106 return 1;
107 else
108 return -1;
109 }
8ec2b484
HH
110}
111
8ec2b484
HH
112//-----------------------------------------------------------------------------
113// HP_Parser
114//-----------------------------------------------------------------------------
115
116class HP_Parser : public wxHtmlParser
117{
211dfedd 118public:
67c276bd
VS
119 HP_Parser()
120 {
121 GetEntitiesParser()->SetEncoding(wxFONTENCODING_ISO8859_1);
122 }
fc7a2a60 123
211dfedd 124 wxObject* GetProduct() { return NULL; }
fc7a2a60 125
211dfedd 126protected:
5bce3e6f 127 virtual void AddText(const wxString& WXUNUSED(txt)) {}
fc7a2a60 128
c0c133e1 129 wxDECLARE_NO_COPY_CLASS(HP_Parser);
8ec2b484
HH
130};
131
132
133//-----------------------------------------------------------------------------
134// HP_TagHandler
135//-----------------------------------------------------------------------------
136
137class HP_TagHandler : public wxHtmlTagHandler
138{
139 private:
91fa114d
VS
140 wxString m_name, m_page;
141 int m_level;
142 int m_id;
143 int m_index;
144 int m_count;
145 wxHtmlHelpDataItem *m_parentItem;
146 wxHtmlBookRecord *m_book;
d1da8872 147
91fa114d 148 wxHtmlHelpDataItems *m_data;
8ec2b484
HH
149
150 public:
04dbb646 151 HP_TagHandler(wxHtmlBookRecord *b) : wxHtmlTagHandler()
91fa114d
VS
152 {
153 m_data = NULL;
154 m_book = b;
155 m_name = m_page = wxEmptyString;
156 m_level = 0;
d1da8872 157 m_id = wxID_ANY;
91fa114d
VS
158 m_count = 0;
159 m_parentItem = NULL;
160 }
66a77a74 161 wxString GetSupportedTags() { return wxT("UL,OBJECT,PARAM"); }
8ec2b484 162 bool HandleTag(const wxHtmlTag& tag);
91fa114d
VS
163
164 void Reset(wxHtmlHelpDataItems& data)
165 {
166 m_data = &data;
167 m_count = 0;
168 m_level = 0;
169 m_parentItem = NULL;
170 }
22f3361e 171
c0c133e1 172 wxDECLARE_NO_COPY_CLASS(HP_TagHandler);
8ec2b484
HH
173};
174
175
176bool HP_TagHandler::HandleTag(const wxHtmlTag& tag)
177{
04dbb646 178 if (tag.GetName() == wxT("UL"))
4f9297b0 179 {
91fa114d
VS
180 wxHtmlHelpDataItem *oldparent = m_parentItem;
181 m_level++;
182 m_parentItem = (m_count > 0) ? &(*m_data)[m_data->size()-1] : NULL;
8ec2b484 183 ParseInner(tag);
91fa114d
VS
184 m_level--;
185 m_parentItem = oldparent;
186 return true;
8ec2b484 187 }
04dbb646 188 else if (tag.GetName() == wxT("OBJECT"))
4f9297b0 189 {
91fa114d 190 m_name = m_page = wxEmptyString;
8ec2b484 191 ParseInner(tag);
50494a55 192
daa084c2 193#if 0
91fa114d 194 if (!page.IsEmpty())
7df9fbc3 195 /* Valid HHW's file may contain only two object tags:
04dbb646 196
4157f43f
VS
197 <OBJECT type="text/site properties">
198 <param name="ImageType" value="Folder">
199 </OBJECT>
04dbb646 200
4157f43f 201 or
04dbb646
VZ
202
203 <OBJECT type="text/sitemap">
204 <param name="Name" value="main page">
205 <param name="Local" value="another.htm">
206 </OBJECT>
207
91fa114d 208 We're interested in the latter. !page.IsEmpty() is valid
4157f43f
VS
209 condition because text/site properties does not contain Local param
210 */
daa084c2
VS
211#endif
212 if (tag.GetParam(wxT("TYPE")) == wxT("text/sitemap"))
4157f43f 213 {
91fa114d
VS
214 wxHtmlHelpDataItem *item = new wxHtmlHelpDataItem();
215 item->parent = m_parentItem;
216 item->level = m_level;
217 item->id = m_id;
218 item->page = m_page;
219 item->name = m_name;
d1da8872 220
91fa114d
VS
221 item->book = m_book;
222 m_data->Add(item);
223 m_count++;
4157f43f 224 }
50494a55 225
91fa114d 226 return true;
8ec2b484 227 }
04dbb646 228 else
4f9297b0 229 { // "PARAM"
91fa114d
VS
230 if (m_name.empty() && tag.GetParam(wxT("NAME")) == wxT("Name"))
231 m_name = tag.GetParam(wxT("VALUE"));
04dbb646 232 if (tag.GetParam(wxT("NAME")) == wxT("Local"))
91fa114d 233 m_page = tag.GetParam(wxT("VALUE"));
04dbb646 234 if (tag.GetParam(wxT("NAME")) == wxT("ID"))
91fa114d
VS
235 tag.GetParamAsInt(wxT("VALUE"), &m_id);
236 return false;
8ec2b484
HH
237 }
238}
239
240
8ec2b484
HH
241//-----------------------------------------------------------------------------
242// wxHtmlHelpData
243//-----------------------------------------------------------------------------
244
468ae730
VS
245wxString wxHtmlBookRecord::GetFullPath(const wxString &page) const
246{
d5bfe584 247 if (wxIsAbsolutePath(page) || page.Find(wxT("file:")) == 0)
468ae730
VS
248 return page;
249 else
250 return m_BasePath + page;
251}
252
91fa114d
VS
253wxString wxHtmlHelpDataItem::GetIndentedName() const
254{
255 wxString s;
256 for (int i = 1; i < level; i++)
9a83f860 257 s << wxT(" ");
91fa114d
VS
258 s << name;
259 return s;
260}
468ae730
VS
261
262
8ec2b484
HH
263IMPLEMENT_DYNAMIC_CLASS(wxHtmlHelpData, wxObject)
264
f42b1601 265wxHtmlHelpData::wxHtmlHelpData()
8ec2b484 266{
8ec2b484
HH
267}
268
269wxHtmlHelpData::~wxHtmlHelpData()
270{
8ec2b484
HH
271}
272
67c276bd
VS
273bool wxHtmlHelpData::LoadMSProject(wxHtmlBookRecord *book, wxFileSystem& fsys,
274 const wxString& indexfile,
275 const wxString& contentsfile)
8ec2b484
HH
276{
277 wxFSFile *f;
2b5f62a0 278 wxHtmlFilterHTML filter;
eb37e1d2 279 wxString buf;
8ec2b484 280 wxString string;
f42b1601 281
8ec2b484
HH
282 HP_Parser parser;
283 HP_TagHandler *handler = new HP_TagHandler(book);
284 parser.AddTagHandler(handler);
285
d3b9f782 286 f = ( contentsfile.empty() ? NULL : fsys.OpenFile(contentsfile) );
04dbb646 287 if (f)
4f9297b0 288 {
eb37e1d2 289 buf.clear();
2b5f62a0 290 buf = filter.ReadFile(*f);
8ec2b484 291 delete f;
91fa114d 292 handler->Reset(m_contents);
8ec2b484 293 parser.Parse(buf);
8ec2b484 294 }
f3c82859 295 else
2b5f62a0 296 {
f6bcfd97 297 wxLogError(_("Cannot open contents file: %s"), contentsfile.c_str());
2b5f62a0 298 }
8ec2b484 299
d3b9f782 300 f = ( indexfile.empty() ? NULL : fsys.OpenFile(indexfile) );
04dbb646 301 if (f)
4f9297b0 302 {
eb37e1d2 303 buf.clear();
2b5f62a0 304 buf = filter.ReadFile(*f);
8ec2b484 305 delete f;
91fa114d 306 handler->Reset(m_index);
8ec2b484 307 parser.Parse(buf);
8ec2b484 308 }
93763ad5 309 else if (!indexfile.empty())
2b5f62a0 310 {
f6bcfd97 311 wxLogError(_("Cannot open index file: %s"), indexfile.c_str());
2b5f62a0 312 }
d1da8872 313 return true;
8ec2b484
HH
314}
315
4fd5055c
VS
316inline static void CacheWriteInt32(wxOutputStream *f, wxInt32 value)
317{
318 wxInt32 x = wxINT32_SWAP_ON_BE(value);
319 f->Write(&x, sizeof(x));
320}
f35822af 321
4fd5055c
VS
322inline static wxInt32 CacheReadInt32(wxInputStream *f)
323{
324 wxInt32 x;
325 f->Read(&x, sizeof(x));
326 return wxINT32_SWAP_ON_BE(x);
327}
f35822af 328
3912b3f8 329inline static void CacheWriteString(wxOutputStream *f, const wxString& str)
d1da8872 330{
3912b3f8
VS
331 const wxWX2MBbuf mbstr = str.mb_str(wxConvUTF8);
332 size_t len = strlen((const char*)mbstr)+1;
4fd5055c 333 CacheWriteInt32(f, len);
3912b3f8 334 f->Write((const char*)mbstr, len);
4fd5055c 335}
f35822af 336
3912b3f8 337inline static wxString CacheReadString(wxInputStream *f)
4fd5055c 338{
4fd5055c 339 size_t len = (size_t)CacheReadInt32(f);
3912b3f8
VS
340 wxCharBuffer str(len-1);
341 f->Read(str.data(), len);
342 return wxString(str, wxConvUTF8);
4fd5055c 343}
f35822af 344
91fa114d 345#define CURRENT_CACHED_BOOK_VERSION 5
d1a9c82b
VS
346
347// Additional flags to detect incompatibilities of the runtime environment:
348#define CACHED_BOOK_FORMAT_FLAGS \
349 (wxUSE_UNICODE << 0)
350
f35822af 351
8ec2b484
HH
352bool wxHtmlHelpData::LoadCachedBook(wxHtmlBookRecord *book, wxInputStream *f)
353{
91fa114d 354 int i, st, newsize;
f35822af
VS
355 wxInt32 version;
356
357 /* load header - version info : */
4fd5055c 358 version = CacheReadInt32(f);
d1da8872 359
04dbb646 360 if (version != CURRENT_CACHED_BOOK_VERSION)
f3c82859 361 {
d1da8872 362 // NB: We can just silently return false here and don't worry about
4fd5055c 363 // it anymore, because AddBookParam will load the MS project in
d1da8872 364 // absence of (properly versioned) .cached file and automatically
4fd5055c 365 // create new .cached file immediately afterward.
91fa114d 366 return false;
f3c82859 367 }
04dbb646 368
d1a9c82b 369 if (CacheReadInt32(f) != CACHED_BOOK_FORMAT_FLAGS)
91fa114d 370 return false;
d1a9c82b 371
8ec2b484 372 /* load contents : */
91fa114d
VS
373 st = m_contents.size();
374 newsize = st + CacheReadInt32(f);
375 m_contents.Alloc(newsize);
376 for (i = st; i < newsize; i++)
4f9297b0 377 {
91fa114d
VS
378 wxHtmlHelpDataItem *item = new wxHtmlHelpDataItem;
379 item->level = CacheReadInt32(f);
380 item->id = CacheReadInt32(f);
381 item->name = CacheReadString(f);
382 item->page = CacheReadString(f);
383 item->book = book;
384 m_contents.Add(item);
8ec2b484
HH
385 }
386
387 /* load index : */
91fa114d
VS
388 st = m_index.size();
389 newsize = st + CacheReadInt32(f);
390 m_index.Alloc(newsize);
391 for (i = st; i < newsize; i++)
4f9297b0 392 {
91fa114d
VS
393 wxHtmlHelpDataItem *item = new wxHtmlHelpDataItem;
394 item->name = CacheReadString(f);
395 item->page = CacheReadString(f);
396 item->level = CacheReadInt32(f);
397 item->book = book;
398 int parentShift = CacheReadInt32(f);
399 if (parentShift != 0)
400 item->parent = &m_index[m_index.size() - parentShift];
401 m_index.Add(item);
8ec2b484 402 }
91fa114d 403 return true;
8ec2b484
HH
404}
405
406
407bool wxHtmlHelpData::SaveCachedBook(wxHtmlBookRecord *book, wxOutputStream *f)
408{
409 int i;
4fd5055c 410 wxInt32 cnt;
f35822af
VS
411
412 /* save header - version info : */
4fd5055c 413 CacheWriteInt32(f, CURRENT_CACHED_BOOK_VERSION);
d1a9c82b 414 CacheWriteInt32(f, CACHED_BOOK_FORMAT_FLAGS);
8ec2b484
HH
415
416 /* save contents : */
91fa114d 417 int len = m_contents.size();
d1da8872 418 for (cnt = 0, i = 0; i < len; i++)
91fa114d 419 if (m_contents[i].book == book && m_contents[i].level > 0)
4fd5055c
VS
420 cnt++;
421 CacheWriteInt32(f, cnt);
8ec2b484 422
91fa114d 423 for (i = 0; i < len; i++)
4f9297b0 424 {
d1da8872 425 if (m_contents[i].book != book || m_contents[i].level == 0)
4fd5055c 426 continue;
91fa114d
VS
427 CacheWriteInt32(f, m_contents[i].level);
428 CacheWriteInt32(f, m_contents[i].id);
429 CacheWriteString(f, m_contents[i].name);
430 CacheWriteString(f, m_contents[i].page);
8ec2b484
HH
431 }
432
433 /* save index : */
91fa114d 434 len = m_index.size();
d1da8872
WS
435 for (cnt = 0, i = 0; i < len; i++)
436 if (m_index[i].book == book && m_index[i].level > 0)
4fd5055c
VS
437 cnt++;
438 CacheWriteInt32(f, cnt);
8ec2b484 439
91fa114d 440 for (i = 0; i < len; i++)
4f9297b0 441 {
d1da8872 442 if (m_index[i].book != book || m_index[i].level == 0)
4fd5055c 443 continue;
91fa114d
VS
444 CacheWriteString(f, m_index[i].name);
445 CacheWriteString(f, m_index[i].page);
446 CacheWriteInt32(f, m_index[i].level);
447 // save distance to parent item, if any:
448 if (m_index[i].parent == NULL)
449 {
450 CacheWriteInt32(f, 0);
451 }
452 else
453 {
17a1ebd1 454 int cnt2 = 0;
91fa114d
VS
455 wxHtmlHelpDataItem *parent = m_index[i].parent;
456 for (int j = i-1; j >= 0; j--)
457 {
458 if (m_index[j].book == book && m_index[j].level > 0)
17a1ebd1 459 cnt2++;
91fa114d
VS
460 if (&m_index[j] == parent)
461 break;
462 }
17a1ebd1
VZ
463 wxASSERT(cnt2 > 0);
464 CacheWriteInt32(f, cnt2);
91fa114d 465 }
8ec2b484 466 }
91fa114d 467 return true;
8ec2b484
HH
468}
469
470
471void wxHtmlHelpData::SetTempDir(const wxString& path)
472{
91fa114d
VS
473 if (path.empty())
474 m_tempPath = path;
04dbb646 475 else
4f9297b0 476 {
0d53638f
VZ
477 wxFileName fn;
478 fn.AssignDir(path);
ec2c85bf 479 fn.MakeAbsolute();
8ec2b484 480
ec2c85bf 481 m_tempPath = fn.GetPath(wxPATH_GET_VOLUME | wxPATH_GET_SEPARATOR);
8ec2b484
HH
482 }
483}
484
485
29e60597
VS
486
487static wxString SafeFileName(const wxString& s)
488{
489 wxString res(s);
490 res.Replace(wxT("#"), wxT("_"));
491 res.Replace(wxT(":"), wxT("_"));
492 res.Replace(wxT("\\"), wxT("_"));
493 res.Replace(wxT("/"), wxT("_"));
494 return res;
495}
496
f35822af 497bool wxHtmlHelpData::AddBookParam(const wxFSFile& bookfile,
f890e2d4 498 wxFontEncoding encoding,
f35822af 499 const wxString& title, const wxString& contfile,
d5bb85a0
VS
500 const wxString& indexfile, const wxString& deftopic,
501 const wxString& path)
8ec2b484 502{
6a63bdc8
JS
503#if wxUSE_WCHAR_T
504 #if wxUSE_UNICODE
505 #define CORRECT_STR(str, conv) \
506 str = wxString((str).mb_str(wxConvISO8859_1), conv)
507 #else
508 #define CORRECT_STR(str, conv) \
509 str = wxString((str).wc_str(conv), wxConvLocal)
510 #endif
511#else
512 #define CORRECT_STR(str, conv)
513#endif
514
8ec2b484
HH
515 wxFileSystem fsys;
516 wxFSFile *fi;
517 wxHtmlBookRecord *bookr;
04dbb646 518
91fa114d
VS
519 int IndexOld = m_index.size(),
520 ContentsOld = m_contents.size();
f42b1601 521
93763ad5 522 if (!path.empty())
d1da8872 523 fsys.ChangePathTo(path, true);
8ec2b484 524
91fa114d 525 size_t booksCnt = m_bookRecords.GetCount();
5ecdcaa7
VS
526 for (size_t i = 0; i < booksCnt; i++)
527 {
91fa114d
VS
528 if ( m_bookRecords[i].GetBookFile() == bookfile.GetLocation() )
529 return true; // book is (was) loaded
5ecdcaa7
VS
530 }
531
6a63bdc8
JS
532 wxString title1 = title;
533 if (encoding != wxFONTENCODING_SYSTEM)
534 {
535 wxCSConv conv(encoding);
536 CORRECT_STR(title1, conv);
537 if (title1.IsEmpty() && !title.IsEmpty())
538 title1 = title;
539 }
540
541 bookr = new wxHtmlBookRecord(bookfile.GetLocation(), fsys.GetPath(), title1, deftopic);
d1da8872 542
91fa114d
VS
543 wxHtmlHelpDataItem *bookitem = new wxHtmlHelpDataItem;
544 bookitem->level = 0;
545 bookitem->id = 0;
546 bookitem->page = deftopic;
547 bookitem->name = title;
548 bookitem->book = bookr;
8ec2b484
HH
549
550 // store the contents index for later
91fa114d
VS
551 int cont_start = m_contents.size();
552
553 m_contents.Add(bookitem);
8ec2b484
HH
554
555 // Try to find cached binary versions:
f35822af
VS
556 // 1. save file as book, but with .hhp.cached extension
557 // 2. same as 1. but in temp path
558 // 3. otherwise or if cache load failed, load it from MS.
04dbb646 559
f35822af 560 fi = fsys.OpenFile(bookfile.GetLocation() + wxT(".cached"));
04dbb646
VZ
561
562 if (fi == NULL ||
e2b87f38 563#if wxUSE_DATETIME
04dbb646 564 fi->GetModificationTime() < bookfile.GetModificationTime() ||
e2b87f38 565#endif // wxUSE_DATETIME
4f9297b0 566 !LoadCachedBook(bookr, fi->GetStream()))
f35822af
VS
567 {
568 if (fi != NULL) delete fi;
91fa114d
VS
569 fi = fsys.OpenFile(m_tempPath + wxFileNameFromPath(bookfile.GetLocation()) + wxT(".cached"));
570 if (m_tempPath.empty() || fi == NULL ||
e2b87f38 571#if wxUSE_DATETIME
04dbb646 572 fi->GetModificationTime() < bookfile.GetModificationTime() ||
e2b87f38 573#endif // wxUSE_DATETIME
4f9297b0 574 !LoadCachedBook(bookr, fi->GetStream()))
f35822af
VS
575 {
576 LoadMSProject(bookr, fsys, indexfile, contfile);
91fa114d 577 if (!m_tempPath.empty())
f35822af 578 {
91fa114d 579 wxFileOutputStream *outs = new wxFileOutputStream(m_tempPath +
29e60597 580 SafeFileName(wxFileNameFromPath(bookfile.GetLocation())) + wxT(".cached"));
f35822af
VS
581 SaveCachedBook(bookr, outs);
582 delete outs;
583 }
d5bb85a0 584 }
8ec2b484 585 }
04dbb646 586
f35822af 587 if (fi != NULL) delete fi;
8ec2b484
HH
588
589 // Now store the contents range
91fa114d 590 bookr->SetContentsRange(cont_start, m_contents.size());
04dbb646 591
3912b3f8
VS
592 // MS HTML Help files [written by MS HTML Help Workshop] are broken
593 // in that the data are iso-8859-1 (including HTML entities), but must
594 // be interpreted as being in language's windows charset. Correct the
595 // differences here and also convert to wxConvLocal in ANSI build
67c276bd 596 if (encoding != wxFONTENCODING_SYSTEM)
3912b3f8 597 {
67c276bd 598 wxCSConv conv(encoding);
91fa114d
VS
599 size_t IndexCnt = m_index.size();
600 size_t ContentsCnt = m_contents.size();
601 size_t i;
602 for (i = IndexOld; i < IndexCnt; i++)
f890e2d4 603 {
91fa114d 604 CORRECT_STR(m_index[i].name, conv);
f890e2d4 605 }
91fa114d 606 for (i = ContentsOld; i < ContentsCnt; i++)
3912b3f8 607 {
91fa114d 608 CORRECT_STR(m_contents[i].name, conv);
3912b3f8
VS
609 }
610 #undef CORRECT_STR
f890e2d4 611 }
8ec2b484 612
91fa114d
VS
613 m_bookRecords.Add(bookr);
614 if (!m_index.empty())
615 {
616 m_index.Sort(wxHtmlHelpIndexCompareFunc);
617 }
f42b1601 618
91fa114d 619 return true;
8ec2b484
HH
620}
621
622
623bool wxHtmlHelpData::AddBook(const wxString& book)
624{
3527f29c
VS
625 wxString extension(book.Right(4).Lower());
626 if (extension == wxT(".zip") ||
627#if wxUSE_LIBMSPACK
628 extension == wxT(".chm") /*compressed html help book*/ ||
629#endif
630 extension == wxT(".htb") /*html book*/)
68364659
VS
631 {
632 wxFileSystem fsys;
633 wxString s;
d1da8872 634 bool rt = false;
68364659 635
3527f29c
VS
636#if wxUSE_LIBMSPACK
637 if (extension == wxT(".chm"))
638 s = fsys.FindFirst(book + wxT("#chm:*.hhp"), wxFILE);
639 else
640#endif
641 s = fsys.FindFirst(book + wxT("#zip:*.hhp"), wxFILE);
642
93763ad5 643 while (!s.empty())
68364659 644 {
d1da8872 645 if (AddBook(s)) rt = true;
68364659
VS
646 s = fsys.FindNext();
647 }
04dbb646 648
68364659
VS
649 return rt;
650 }
68364659 651
a509f830
VZ
652 wxFSFile *fi;
653 wxFileSystem fsys;
3dde6c72 654
a509f830
VZ
655 wxString title = _("noname"),
656 safetitle,
657 start = wxEmptyString,
658 contents = wxEmptyString,
659 index = wxEmptyString,
660 charset = wxEmptyString;
68364659 661
a509f830
VZ
662 fi = fsys.OpenFile(book);
663 if (fi == NULL)
664 {
665 wxLogError(_("Cannot open HTML help book: %s"), book.c_str());
d1da8872 666 return false;
68364659 667 }
a509f830
VZ
668 fsys.ChangePathTo(book);
669
670 const wxChar *lineptr;
671 wxChar linebuf[300];
672 wxString tmp;
673 wxHtmlFilterPlainText filter;
674 tmp = filter.ReadFile(*fi);
675 lineptr = tmp.c_str();
676
d1da8872 677 do
a509f830
VZ
678 {
679 lineptr = ReadLine(lineptr, linebuf, 300);
d1da8872 680
a509f830 681 for (wxChar *ch = linebuf; *ch != wxT('\0') && *ch != wxT('='); ch++)
42841dfc 682 *ch = (wxChar)wxTolower(*ch);
a509f830 683
9a83f860
VZ
684 if (wxStrstr(linebuf, wxT("title=")) == linebuf)
685 title = linebuf + wxStrlen(wxT("title="));
686 if (wxStrstr(linebuf, wxT("default topic=")) == linebuf)
687 start = linebuf + wxStrlen(wxT("default topic="));
688 if (wxStrstr(linebuf, wxT("index file=")) == linebuf)
689 index = linebuf + wxStrlen(wxT("index file="));
690 if (wxStrstr(linebuf, wxT("contents file=")) == linebuf)
691 contents = linebuf + wxStrlen(wxT("contents file="));
692 if (wxStrstr(linebuf, wxT("charset=")) == linebuf)
693 charset = linebuf + wxStrlen(wxT("charset="));
a509f830 694 } while (lineptr != NULL);
d1da8872 695
5a969262
RR
696 wxFontEncoding enc = wxFONTENCODING_SYSTEM;
697#if wxUSE_FONTMAP
698 if (charset != wxEmptyString)
699 enc = wxFontMapper::Get()->CharsetToEncoding(charset);
700#endif
a509f830 701
67c276bd 702 bool rtval = AddBookParam(*fi, enc,
a509f830
VZ
703 title, contents, index, start, fsys.GetPath());
704 delete fi;
91fa114d 705
a509f830 706 return rtval;
8ec2b484
HH
707}
708
709wxString wxHtmlHelpData::FindPageByName(const wxString& x)
710{
8ec2b484 711 int i;
8ec2b484 712
8680ee06
RR
713 bool has_non_ascii = false;
714 wxString::const_iterator it;
715 for (it = x.begin(); it != x.end(); ++it)
716 {
717 wxUniChar ch = *it;
718 if (!ch.IsAscii())
719 {
720 has_non_ascii = true;
721 break;
722 }
723 }
03647350 724
8680ee06 725 int cnt = m_bookRecords.GetCount();
03647350 726
8680ee06 727 if (!has_non_ascii)
4f9297b0 728 {
8680ee06
RR
729 wxFileSystem fsys;
730 wxFSFile *f;
731 // 1. try to open given file:
732 for (i = 0; i < cnt; i++)
733 {
91fa114d 734 f = fsys.OpenFile(m_bookRecords[i].GetFullPath(x));
04dbb646
VZ
735 if (f)
736 {
91fa114d 737 wxString url = m_bookRecords[i].GetFullPath(x);
8ec2b484
HH
738 delete f;
739 return url;
740 }
8680ee06 741 }
8ec2b484
HH
742 }
743
744
735a74df 745 // 2. try to find a book:
04dbb646 746 for (i = 0; i < cnt; i++)
4f9297b0 747 {
91fa114d
VS
748 if (m_bookRecords[i].GetTitle() == x)
749 return m_bookRecords[i].GetFullPath(m_bookRecords[i].GetStart());
8ec2b484
HH
750 }
751
735a74df 752 // 3. try to find in contents:
91fa114d 753 cnt = m_contents.size();
04dbb646 754 for (i = 0; i < cnt; i++)
4f9297b0 755 {
91fa114d
VS
756 if (m_contents[i].name == x)
757 return m_contents[i].GetFullPath();
8ec2b484
HH
758 }
759
760
735a74df 761 // 4. try to find in index:
91fa114d 762 cnt = m_index.size();
04dbb646 763 for (i = 0; i < cnt; i++)
4f9297b0 764 {
91fa114d
VS
765 if (m_index[i].name == x)
766 return m_index[i].GetFullPath();
8ec2b484
HH
767 }
768
735a74df
VZ
769 // 4b. if still not found, try case-insensitive comparison
770 for (i = 0; i < cnt; i++)
771 {
772 if (m_index[i].name.CmpNoCase(x) == 0)
773 return m_index[i].GetFullPath();
774 }
775
91fa114d 776 return wxEmptyString;
8ec2b484
HH
777}
778
779wxString wxHtmlHelpData::FindPageById(int id)
f42b1601 780{
91fa114d
VS
781 size_t cnt = m_contents.size();
782 for (size_t i = 0; i < cnt; i++)
4f9297b0 783 {
91fa114d 784 if (m_contents[i].id == id)
04dbb646 785 {
91fa114d 786 return m_contents[i].GetFullPath();
8ec2b484
HH
787 }
788 }
789
91fa114d
VS
790 return wxEmptyString;
791}
792
91fa114d 793
8ec2b484
HH
794//----------------------------------------------------------------------------------
795// wxHtmlSearchStatus functions
796//----------------------------------------------------------------------------------
797
798wxHtmlSearchStatus::wxHtmlSearchStatus(wxHtmlHelpData* data, const wxString& keyword,
c4971147 799 bool case_sensitive, bool whole_words_only,
d5bb85a0 800 const wxString& book)
8ec2b484
HH
801{
802 m_Data = data;
803 m_Keyword = keyword;
804 wxHtmlBookRecord* bookr = NULL;
04dbb646 805 if (book != wxEmptyString)
4f9297b0 806 {
d5bb85a0 807 // we have to search in a specific book. Find it first
91fa114d 808 int i, cnt = data->m_bookRecords.GetCount();
d5bb85a0 809 for (i = 0; i < cnt; i++)
91fa114d 810 if (data->m_bookRecords[i].GetTitle() == book)
04dbb646 811 {
91fa114d 812 bookr = &(data->m_bookRecords[i]);
d5bb85a0
VS
813 m_CurIndex = bookr->GetContentsStart();
814 m_MaxIndex = bookr->GetContentsEnd();
815 break;
816 }
817 // check; we won't crash if the book doesn't exist, but it's Bad Anyway.
818 wxASSERT(bookr);
8ec2b484 819 }
04dbb646 820 if (! bookr)
4f9297b0 821 {
d5bb85a0
VS
822 // no book specified; search all books
823 m_CurIndex = 0;
91fa114d 824 m_MaxIndex = m_Data->m_contents.size();
8ec2b484 825 }
c4971147 826 m_Engine.LookFor(keyword, case_sensitive, whole_words_only);
8ec2b484 827 m_Active = (m_CurIndex < m_MaxIndex);
8ec2b484
HH
828}
829
830bool wxHtmlSearchStatus::Search()
831{
8ec2b484 832 wxFSFile *file;
d5bb85a0 833 int i = m_CurIndex; // shortcut
91fa114d 834 bool found = false;
3912b3f8 835 wxString thepage;
8ec2b484 836
04dbb646 837 if (!m_Active)
4f9297b0 838 {
f35822af 839 // sanity check. Illegal use, but we'll try to prevent a crash anyway
50494a55 840 wxASSERT(m_Active);
91fa114d 841 return false;
8ec2b484
HH
842 }
843
8ec2b484 844 m_Name = wxEmptyString;
91fa114d
VS
845 m_CurItem = NULL;
846 thepage = m_Data->m_contents[i].page;
8ec2b484 847
b5a7b000
VS
848 m_Active = (++m_CurIndex < m_MaxIndex);
849 // check if it is same page with different anchor:
3912b3f8 850 if (!m_LastPage.empty())
b5a7b000 851 {
3912b3f8
VS
852 const wxChar *p1, *p2;
853 for (p1 = thepage.c_str(), p2 = m_LastPage.c_str();
9a83f860 854 *p1 != 0 && *p1 != wxT('#') && *p1 == *p2; p1++, p2++) {}
b5a7b000
VS
855
856 m_LastPage = thepage;
857
9a83f860 858 if (*p1 == 0 || *p1 == wxT('#'))
3912b3f8 859 return false;
b5a7b000
VS
860 }
861 else m_LastPage = thepage;
04dbb646 862
f35822af 863 wxFileSystem fsys;
91fa114d 864 file = fsys.OpenFile(m_Data->m_contents[i].book->GetFullPath(thepage));
04dbb646 865 if (file)
b5a7b000 866 {
2b5f62a0 867 if (m_Engine.Scan(*file))
468ae730 868 {
91fa114d
VS
869 m_Name = m_Data->m_contents[i].name;
870 m_CurItem = &m_Data->m_contents[i];
871 found = true;
d5bb85a0
VS
872 }
873 delete file;
8ec2b484 874 }
8ec2b484
HH
875 return found;
876}
877
d5bb85a0
VS
878
879
880
881
882
883
884
885//--------------------------------------------------------------------------------
2b5f62a0 886// wxHtmlSearchEngine
d5bb85a0
VS
887//--------------------------------------------------------------------------------
888
2b5f62a0 889void wxHtmlSearchEngine::LookFor(const wxString& keyword, bool case_sensitive, bool whole_words_only)
d5bb85a0 890{
c4971147
VS
891 m_CaseSensitive = case_sensitive;
892 m_WholeWords = whole_words_only;
3912b3f8 893 m_Keyword = keyword;
04dbb646 894
3444e4a8 895 if (!m_CaseSensitive)
3912b3f8 896 m_Keyword.LowerCase();
d5bb85a0
VS
897}
898
899
1a1dac18
MB
900static inline bool WHITESPACE(wxChar c)
901{
9a83f860 902 return c == wxT(' ') || c == wxT('\n') || c == wxT('\r') || c == wxT('\t');
1a1dac18 903}
c4971147 904
21dc4638
VZ
905// replace continuous spaces by one single space
906static inline wxString CompressSpaces(const wxString & str)
907{
908 wxString buf;
909 buf.reserve( str.size() );
910
911 bool space_counted = false;
912 for( const wxChar * pstr = str.c_str(); *pstr; ++pstr )
913 {
914 wxChar ch = *pstr;
915 if( WHITESPACE( ch ) )
916 {
917 if( space_counted )
918 {
919 continue;
920 }
9a83f860 921 ch = wxT(' ');
21dc4638
VZ
922 space_counted = true;
923 }
924 else
925 {
926 space_counted = false;
927 }
928 buf += ch;
929 }
930
931 return buf;
932}
933
2b5f62a0 934bool wxHtmlSearchEngine::Scan(const wxFSFile& file)
d5bb85a0 935{
3912b3f8 936 wxASSERT_MSG(!m_Keyword.empty(), wxT("wxHtmlSearchEngine::LookFor must be called before scanning!"));
d5bb85a0 937
2b5f62a0 938 wxHtmlFilterHTML filter;
21dc4638 939 wxString bufStr = filter.ReadFile(file);
d5bb85a0 940
c4971147 941 if (!m_CaseSensitive)
21dc4638 942 bufStr.LowerCase();
d5bb85a0 943
21dc4638
VZ
944 { // remove html tags
945 wxString bufStrCopy;
946 bufStrCopy.reserve( bufStr.size() );
947 bool insideTag = false;
948 for (const wxChar * pBufStr = bufStr.c_str(); *pBufStr; ++pBufStr)
04dbb646 949 {
21dc4638
VZ
950 wxChar c = *pBufStr;
951 if (insideTag)
952 {
9a83f860 953 if (c == wxT('>'))
21dc4638
VZ
954 {
955 insideTag = false;
956 // replace the tag by an empty space
9a83f860 957 c = wxT(' ');
21dc4638
VZ
958 }
959 else
960 continue;
961 }
9a83f860 962 else if (c == wxT('<'))
21dc4638
VZ
963 {
964 wxChar nextCh = *(pBufStr + 1);
9a83f860 965 if (nextCh == wxT('/') || !WHITESPACE(nextCh))
21dc4638
VZ
966 {
967 insideTag = true;
968 continue;
969 }
970 }
971 bufStrCopy += c;
c4971147 972 }
21dc4638 973 bufStr.swap( bufStrCopy );
c4971147 974 }
04dbb646 975
21dc4638
VZ
976 wxString keyword = m_Keyword;
977
978 if (m_WholeWords)
c4971147 979 {
21dc4638 980 // insert ' ' at the beginning and at the end
9a83f860
VZ
981 keyword.insert( 0, wxT(" ") );
982 keyword.append( wxT(" ") );
983 bufStr.insert( 0, wxT(" ") );
984 bufStr.append( wxT(" ") );
d5bb85a0
VS
985 }
986
21dc4638
VZ
987 // remove continuous spaces
988 keyword = CompressSpaces( keyword );
989 bufStr = CompressSpaces( bufStr );
d5bb85a0 990
21dc4638
VZ
991 // finally do the search
992 return bufStr.find( keyword ) != wxString::npos;
993}
d5bb85a0 994
8ec2b484 995#endif