]> git.saurik.com Git - wxWidgets.git/blame - src/html/helpdata.cpp
Fix FileTestCase to really test strings with embedded NULs.
[wxWidgets.git] / src / html / helpdata.cpp
CommitLineData
8ec2b484 1/////////////////////////////////////////////////////////////////////////////
93763ad5 2// Name: src/html/helpdata.cpp
8ec2b484 3// Purpose: wxHtmlHelpData
f42b1601 4// Notes: Based on htmlhelp.cpp, implementing a monolithic
8ec2b484
HH
5// HTML Help controller class, by Vaclav Slavik
6// Author: Harm van der Heijden and Vaclav Slavik
69941f05 7// RCS-ID: $Id$
8ec2b484 8// Copyright: (c) Harm van der Heijden and Vaclav Slavik
65571936 9// Licence: wxWindows licence
8ec2b484
HH
10/////////////////////////////////////////////////////////////////////////////
11
8ec2b484
HH
12// For compilers that support precompilation, includes "wx.h".
13#include "wx/wxprec.h"
14
15#ifdef __BORLANDC__
93763ad5 16 #pragma hdrstop
8ec2b484
HH
17#endif
18
f6bcfd97 19#if wxUSE_HTML && wxUSE_STREAMS
8ec2b484 20
b4f4d3dd 21#ifndef WX_PRECOMP
04dbb646
VZ
22 #include "wx/intl.h"
23 #include "wx/log.h"
8ec2b484
HH
24#endif
25
401eb3de
RR
26#include <ctype.h>
27
8ec2b484
HH
28#include "wx/html/helpdata.h"
29#include "wx/tokenzr.h"
30#include "wx/wfstream.h"
31#include "wx/busyinfo.h"
f890e2d4
VS
32#include "wx/encconv.h"
33#include "wx/fontmap.h"
69941f05 34#include "wx/html/htmlpars.h"
8ec2b484 35#include "wx/html/htmldefs.h"
2b5f62a0 36#include "wx/html/htmlfilt.h"
057b55b0 37#include "wx/filename.h"
8ec2b484
HH
38
39#include "wx/arrimpl.cpp"
40WX_DEFINE_OBJARRAY(wxHtmlBookRecArray)
91fa114d 41WX_DEFINE_OBJARRAY(wxHtmlHelpDataItems)
8ec2b484
HH
42
43//-----------------------------------------------------------------------------
44// static helper functions
45//-----------------------------------------------------------------------------
46
47// Reads one line, stores it into buf and returns pointer to new line or NULL.
1a1dac18 48static const wxChar* ReadLine(const wxChar *line, wxChar *buf, size_t bufsize)
8ec2b484 49{
1a1dac18
MB
50 wxChar *writeptr = buf;
51 wxChar *endptr = buf + bufsize - 1;
52 const wxChar *readptr = line;
8ec2b484 53
9a83f860 54 while (*readptr != 0 && *readptr != wxT('\r') && *readptr != wxT('\n') &&
d1da8872 55 writeptr != endptr)
3dde6c72 56 *(writeptr++) = *(readptr++);
8ec2b484 57 *writeptr = 0;
9a83f860 58 while (*readptr == wxT('\r') || *readptr == wxT('\n'))
3dde6c72
VS
59 readptr++;
60 if (*readptr == 0)
61 return NULL;
d1da8872 62 else
3dde6c72 63 return readptr;
8ec2b484
HH
64}
65
66
8ec2b484 67
91fa114d
VS
68static int
69wxHtmlHelpIndexCompareFunc(wxHtmlHelpDataItem **a, wxHtmlHelpDataItem **b)
8ec2b484 70{
91fa114d
VS
71 wxHtmlHelpDataItem *ia = *a;
72 wxHtmlHelpDataItem *ib = *b;
3912b3f8 73
7fbe5489
VS
74 if (ia == NULL)
75 return -1;
76 if (ib == NULL)
77 return 1;
42841dfc 78
91fa114d
VS
79 if (ia->parent == ib->parent)
80 {
81 return ia->name.CmpNoCase(ib->name);
82 }
83 else if (ia->level == ib->level)
84 {
85 return wxHtmlHelpIndexCompareFunc(&ia->parent, &ib->parent);
86 }
87 else
88 {
89 wxHtmlHelpDataItem *ia2 = ia;
90 wxHtmlHelpDataItem *ib2 = ib;
d1da8872 91
91fa114d
VS
92 while (ia2->level > ib2->level)
93 {
94 ia2 = ia2->parent;
95 }
96 while (ib2->level > ia2->level)
97 {
98 ib2 = ib2->parent;
99 }
d1da8872 100
91fa114d
VS
101 wxASSERT(ia2);
102 wxASSERT(ib2);
103 int res = wxHtmlHelpIndexCompareFunc(&ia2, &ib2);
104 if (res != 0)
105 return res;
106 else if (ia->level > ib->level)
107 return 1;
108 else
109 return -1;
110 }
8ec2b484
HH
111}
112
8ec2b484
HH
113//-----------------------------------------------------------------------------
114// HP_Parser
115//-----------------------------------------------------------------------------
116
117class HP_Parser : public wxHtmlParser
118{
211dfedd 119public:
67c276bd
VS
120 HP_Parser()
121 {
122 GetEntitiesParser()->SetEncoding(wxFONTENCODING_ISO8859_1);
123 }
fc7a2a60 124
211dfedd 125 wxObject* GetProduct() { return NULL; }
fc7a2a60 126
211dfedd 127protected:
5bce3e6f 128 virtual void AddText(const wxString& WXUNUSED(txt)) {}
fc7a2a60 129
c0c133e1 130 wxDECLARE_NO_COPY_CLASS(HP_Parser);
8ec2b484
HH
131};
132
133
134//-----------------------------------------------------------------------------
135// HP_TagHandler
136//-----------------------------------------------------------------------------
137
138class HP_TagHandler : public wxHtmlTagHandler
139{
140 private:
91fa114d
VS
141 wxString m_name, m_page;
142 int m_level;
143 int m_id;
144 int m_index;
145 int m_count;
146 wxHtmlHelpDataItem *m_parentItem;
147 wxHtmlBookRecord *m_book;
d1da8872 148
91fa114d 149 wxHtmlHelpDataItems *m_data;
8ec2b484
HH
150
151 public:
04dbb646 152 HP_TagHandler(wxHtmlBookRecord *b) : wxHtmlTagHandler()
91fa114d
VS
153 {
154 m_data = NULL;
155 m_book = b;
156 m_name = m_page = wxEmptyString;
157 m_level = 0;
d1da8872 158 m_id = wxID_ANY;
91fa114d
VS
159 m_count = 0;
160 m_parentItem = NULL;
161 }
66a77a74 162 wxString GetSupportedTags() { return wxT("UL,OBJECT,PARAM"); }
8ec2b484 163 bool HandleTag(const wxHtmlTag& tag);
91fa114d
VS
164
165 void Reset(wxHtmlHelpDataItems& data)
166 {
167 m_data = &data;
168 m_count = 0;
169 m_level = 0;
170 m_parentItem = NULL;
171 }
22f3361e 172
c0c133e1 173 wxDECLARE_NO_COPY_CLASS(HP_TagHandler);
8ec2b484
HH
174};
175
176
177bool HP_TagHandler::HandleTag(const wxHtmlTag& tag)
178{
04dbb646 179 if (tag.GetName() == wxT("UL"))
4f9297b0 180 {
91fa114d
VS
181 wxHtmlHelpDataItem *oldparent = m_parentItem;
182 m_level++;
183 m_parentItem = (m_count > 0) ? &(*m_data)[m_data->size()-1] : NULL;
8ec2b484 184 ParseInner(tag);
91fa114d
VS
185 m_level--;
186 m_parentItem = oldparent;
187 return true;
8ec2b484 188 }
04dbb646 189 else if (tag.GetName() == wxT("OBJECT"))
4f9297b0 190 {
91fa114d 191 m_name = m_page = wxEmptyString;
8ec2b484 192 ParseInner(tag);
50494a55 193
daa084c2 194#if 0
91fa114d 195 if (!page.IsEmpty())
7df9fbc3 196 /* Valid HHW's file may contain only two object tags:
04dbb646 197
4157f43f
VS
198 <OBJECT type="text/site properties">
199 <param name="ImageType" value="Folder">
200 </OBJECT>
04dbb646 201
4157f43f 202 or
04dbb646
VZ
203
204 <OBJECT type="text/sitemap">
205 <param name="Name" value="main page">
206 <param name="Local" value="another.htm">
207 </OBJECT>
208
91fa114d 209 We're interested in the latter. !page.IsEmpty() is valid
4157f43f
VS
210 condition because text/site properties does not contain Local param
211 */
daa084c2
VS
212#endif
213 if (tag.GetParam(wxT("TYPE")) == wxT("text/sitemap"))
4157f43f 214 {
91fa114d
VS
215 wxHtmlHelpDataItem *item = new wxHtmlHelpDataItem();
216 item->parent = m_parentItem;
217 item->level = m_level;
218 item->id = m_id;
219 item->page = m_page;
220 item->name = m_name;
d1da8872 221
91fa114d
VS
222 item->book = m_book;
223 m_data->Add(item);
224 m_count++;
4157f43f 225 }
50494a55 226
91fa114d 227 return true;
8ec2b484 228 }
04dbb646 229 else
4f9297b0 230 { // "PARAM"
91fa114d
VS
231 if (m_name.empty() && tag.GetParam(wxT("NAME")) == wxT("Name"))
232 m_name = tag.GetParam(wxT("VALUE"));
04dbb646 233 if (tag.GetParam(wxT("NAME")) == wxT("Local"))
91fa114d 234 m_page = tag.GetParam(wxT("VALUE"));
04dbb646 235 if (tag.GetParam(wxT("NAME")) == wxT("ID"))
91fa114d
VS
236 tag.GetParamAsInt(wxT("VALUE"), &m_id);
237 return false;
8ec2b484
HH
238 }
239}
240
241
8ec2b484
HH
242//-----------------------------------------------------------------------------
243// wxHtmlHelpData
244//-----------------------------------------------------------------------------
245
468ae730
VS
246wxString wxHtmlBookRecord::GetFullPath(const wxString &page) const
247{
248 if (wxIsAbsolutePath(page))
249 return page;
250 else
251 return m_BasePath + page;
252}
253
91fa114d
VS
254wxString wxHtmlHelpDataItem::GetIndentedName() const
255{
256 wxString s;
257 for (int i = 1; i < level; i++)
9a83f860 258 s << wxT(" ");
91fa114d
VS
259 s << name;
260 return s;
261}
468ae730
VS
262
263
8ec2b484
HH
264IMPLEMENT_DYNAMIC_CLASS(wxHtmlHelpData, wxObject)
265
f42b1601 266wxHtmlHelpData::wxHtmlHelpData()
8ec2b484 267{
8ec2b484
HH
268}
269
270wxHtmlHelpData::~wxHtmlHelpData()
271{
8ec2b484
HH
272}
273
67c276bd
VS
274bool wxHtmlHelpData::LoadMSProject(wxHtmlBookRecord *book, wxFileSystem& fsys,
275 const wxString& indexfile,
276 const wxString& contentsfile)
8ec2b484
HH
277{
278 wxFSFile *f;
2b5f62a0 279 wxHtmlFilterHTML filter;
eb37e1d2 280 wxString buf;
8ec2b484 281 wxString string;
f42b1601 282
8ec2b484
HH
283 HP_Parser parser;
284 HP_TagHandler *handler = new HP_TagHandler(book);
285 parser.AddTagHandler(handler);
286
d3b9f782 287 f = ( contentsfile.empty() ? NULL : fsys.OpenFile(contentsfile) );
04dbb646 288 if (f)
4f9297b0 289 {
eb37e1d2 290 buf.clear();
2b5f62a0 291 buf = filter.ReadFile(*f);
8ec2b484 292 delete f;
91fa114d 293 handler->Reset(m_contents);
8ec2b484 294 parser.Parse(buf);
8ec2b484 295 }
f3c82859 296 else
2b5f62a0 297 {
f6bcfd97 298 wxLogError(_("Cannot open contents file: %s"), contentsfile.c_str());
2b5f62a0 299 }
8ec2b484 300
d3b9f782 301 f = ( indexfile.empty() ? NULL : fsys.OpenFile(indexfile) );
04dbb646 302 if (f)
4f9297b0 303 {
eb37e1d2 304 buf.clear();
2b5f62a0 305 buf = filter.ReadFile(*f);
8ec2b484 306 delete f;
91fa114d 307 handler->Reset(m_index);
8ec2b484 308 parser.Parse(buf);
8ec2b484 309 }
93763ad5 310 else if (!indexfile.empty())
2b5f62a0 311 {
f6bcfd97 312 wxLogError(_("Cannot open index file: %s"), indexfile.c_str());
2b5f62a0 313 }
d1da8872 314 return true;
8ec2b484
HH
315}
316
4fd5055c
VS
317inline static void CacheWriteInt32(wxOutputStream *f, wxInt32 value)
318{
319 wxInt32 x = wxINT32_SWAP_ON_BE(value);
320 f->Write(&x, sizeof(x));
321}
f35822af 322
4fd5055c
VS
323inline static wxInt32 CacheReadInt32(wxInputStream *f)
324{
325 wxInt32 x;
326 f->Read(&x, sizeof(x));
327 return wxINT32_SWAP_ON_BE(x);
328}
f35822af 329
3912b3f8 330inline static void CacheWriteString(wxOutputStream *f, const wxString& str)
d1da8872 331{
3912b3f8
VS
332 const wxWX2MBbuf mbstr = str.mb_str(wxConvUTF8);
333 size_t len = strlen((const char*)mbstr)+1;
4fd5055c 334 CacheWriteInt32(f, len);
3912b3f8 335 f->Write((const char*)mbstr, len);
4fd5055c 336}
f35822af 337
3912b3f8 338inline static wxString CacheReadString(wxInputStream *f)
4fd5055c 339{
4fd5055c 340 size_t len = (size_t)CacheReadInt32(f);
3912b3f8
VS
341 wxCharBuffer str(len-1);
342 f->Read(str.data(), len);
343 return wxString(str, wxConvUTF8);
4fd5055c 344}
f35822af 345
91fa114d 346#define CURRENT_CACHED_BOOK_VERSION 5
d1a9c82b
VS
347
348// Additional flags to detect incompatibilities of the runtime environment:
349#define CACHED_BOOK_FORMAT_FLAGS \
350 (wxUSE_UNICODE << 0)
351
f35822af 352
8ec2b484
HH
353bool wxHtmlHelpData::LoadCachedBook(wxHtmlBookRecord *book, wxInputStream *f)
354{
91fa114d 355 int i, st, newsize;
f35822af
VS
356 wxInt32 version;
357
358 /* load header - version info : */
4fd5055c 359 version = CacheReadInt32(f);
d1da8872 360
04dbb646 361 if (version != CURRENT_CACHED_BOOK_VERSION)
f3c82859 362 {
d1da8872 363 // NB: We can just silently return false here and don't worry about
4fd5055c 364 // it anymore, because AddBookParam will load the MS project in
d1da8872 365 // absence of (properly versioned) .cached file and automatically
4fd5055c 366 // create new .cached file immediately afterward.
91fa114d 367 return false;
f3c82859 368 }
04dbb646 369
d1a9c82b 370 if (CacheReadInt32(f) != CACHED_BOOK_FORMAT_FLAGS)
91fa114d 371 return false;
d1a9c82b 372
8ec2b484 373 /* load contents : */
91fa114d
VS
374 st = m_contents.size();
375 newsize = st + CacheReadInt32(f);
376 m_contents.Alloc(newsize);
377 for (i = st; i < newsize; i++)
4f9297b0 378 {
91fa114d
VS
379 wxHtmlHelpDataItem *item = new wxHtmlHelpDataItem;
380 item->level = CacheReadInt32(f);
381 item->id = CacheReadInt32(f);
382 item->name = CacheReadString(f);
383 item->page = CacheReadString(f);
384 item->book = book;
385 m_contents.Add(item);
8ec2b484
HH
386 }
387
388 /* load index : */
91fa114d
VS
389 st = m_index.size();
390 newsize = st + CacheReadInt32(f);
391 m_index.Alloc(newsize);
392 for (i = st; i < newsize; i++)
4f9297b0 393 {
91fa114d
VS
394 wxHtmlHelpDataItem *item = new wxHtmlHelpDataItem;
395 item->name = CacheReadString(f);
396 item->page = CacheReadString(f);
397 item->level = CacheReadInt32(f);
398 item->book = book;
399 int parentShift = CacheReadInt32(f);
400 if (parentShift != 0)
401 item->parent = &m_index[m_index.size() - parentShift];
402 m_index.Add(item);
8ec2b484 403 }
91fa114d 404 return true;
8ec2b484
HH
405}
406
407
408bool wxHtmlHelpData::SaveCachedBook(wxHtmlBookRecord *book, wxOutputStream *f)
409{
410 int i;
4fd5055c 411 wxInt32 cnt;
f35822af
VS
412
413 /* save header - version info : */
4fd5055c 414 CacheWriteInt32(f, CURRENT_CACHED_BOOK_VERSION);
d1a9c82b 415 CacheWriteInt32(f, CACHED_BOOK_FORMAT_FLAGS);
8ec2b484
HH
416
417 /* save contents : */
91fa114d 418 int len = m_contents.size();
d1da8872 419 for (cnt = 0, i = 0; i < len; i++)
91fa114d 420 if (m_contents[i].book == book && m_contents[i].level > 0)
4fd5055c
VS
421 cnt++;
422 CacheWriteInt32(f, cnt);
8ec2b484 423
91fa114d 424 for (i = 0; i < len; i++)
4f9297b0 425 {
d1da8872 426 if (m_contents[i].book != book || m_contents[i].level == 0)
4fd5055c 427 continue;
91fa114d
VS
428 CacheWriteInt32(f, m_contents[i].level);
429 CacheWriteInt32(f, m_contents[i].id);
430 CacheWriteString(f, m_contents[i].name);
431 CacheWriteString(f, m_contents[i].page);
8ec2b484
HH
432 }
433
434 /* save index : */
91fa114d 435 len = m_index.size();
d1da8872
WS
436 for (cnt = 0, i = 0; i < len; i++)
437 if (m_index[i].book == book && m_index[i].level > 0)
4fd5055c
VS
438 cnt++;
439 CacheWriteInt32(f, cnt);
8ec2b484 440
91fa114d 441 for (i = 0; i < len; i++)
4f9297b0 442 {
d1da8872 443 if (m_index[i].book != book || m_index[i].level == 0)
4fd5055c 444 continue;
91fa114d
VS
445 CacheWriteString(f, m_index[i].name);
446 CacheWriteString(f, m_index[i].page);
447 CacheWriteInt32(f, m_index[i].level);
448 // save distance to parent item, if any:
449 if (m_index[i].parent == NULL)
450 {
451 CacheWriteInt32(f, 0);
452 }
453 else
454 {
17a1ebd1 455 int cnt2 = 0;
91fa114d
VS
456 wxHtmlHelpDataItem *parent = m_index[i].parent;
457 for (int j = i-1; j >= 0; j--)
458 {
459 if (m_index[j].book == book && m_index[j].level > 0)
17a1ebd1 460 cnt2++;
91fa114d
VS
461 if (&m_index[j] == parent)
462 break;
463 }
17a1ebd1
VZ
464 wxASSERT(cnt2 > 0);
465 CacheWriteInt32(f, cnt2);
91fa114d 466 }
8ec2b484 467 }
91fa114d 468 return true;
8ec2b484
HH
469}
470
471
472void wxHtmlHelpData::SetTempDir(const wxString& path)
473{
91fa114d
VS
474 if (path.empty())
475 m_tempPath = path;
04dbb646 476 else
4f9297b0 477 {
91fa114d 478 if (wxIsAbsolutePath(path)) m_tempPath = path;
9a83f860 479 else m_tempPath = wxGetCwd() + wxT("/") + path;
8ec2b484 480
9a83f860
VZ
481 if (m_tempPath[m_tempPath.length() - 1] != wxT('/'))
482 m_tempPath << wxT('/');
8ec2b484
HH
483 }
484}
485
486
29e60597
VS
487
488static wxString SafeFileName(const wxString& s)
489{
490 wxString res(s);
491 res.Replace(wxT("#"), wxT("_"));
492 res.Replace(wxT(":"), wxT("_"));
493 res.Replace(wxT("\\"), wxT("_"));
494 res.Replace(wxT("/"), wxT("_"));
495 return res;
496}
497
f35822af 498bool wxHtmlHelpData::AddBookParam(const wxFSFile& bookfile,
f890e2d4 499 wxFontEncoding encoding,
f35822af 500 const wxString& title, const wxString& contfile,
d5bb85a0
VS
501 const wxString& indexfile, const wxString& deftopic,
502 const wxString& path)
8ec2b484
HH
503{
504 wxFileSystem fsys;
505 wxFSFile *fi;
506 wxHtmlBookRecord *bookr;
04dbb646 507
91fa114d
VS
508 int IndexOld = m_index.size(),
509 ContentsOld = m_contents.size();
f42b1601 510
93763ad5 511 if (!path.empty())
d1da8872 512 fsys.ChangePathTo(path, true);
8ec2b484 513
91fa114d 514 size_t booksCnt = m_bookRecords.GetCount();
5ecdcaa7
VS
515 for (size_t i = 0; i < booksCnt; i++)
516 {
91fa114d
VS
517 if ( m_bookRecords[i].GetBookFile() == bookfile.GetLocation() )
518 return true; // book is (was) loaded
5ecdcaa7
VS
519 }
520
521 bookr = new wxHtmlBookRecord(bookfile.GetLocation(), fsys.GetPath(), title, deftopic);
d1da8872 522
91fa114d
VS
523 wxHtmlHelpDataItem *bookitem = new wxHtmlHelpDataItem;
524 bookitem->level = 0;
525 bookitem->id = 0;
526 bookitem->page = deftopic;
527 bookitem->name = title;
528 bookitem->book = bookr;
8ec2b484
HH
529
530 // store the contents index for later
91fa114d
VS
531 int cont_start = m_contents.size();
532
533 m_contents.Add(bookitem);
8ec2b484
HH
534
535 // Try to find cached binary versions:
f35822af
VS
536 // 1. save file as book, but with .hhp.cached extension
537 // 2. same as 1. but in temp path
538 // 3. otherwise or if cache load failed, load it from MS.
04dbb646 539
f35822af 540 fi = fsys.OpenFile(bookfile.GetLocation() + wxT(".cached"));
04dbb646
VZ
541
542 if (fi == NULL ||
e2b87f38 543#if wxUSE_DATETIME
04dbb646 544 fi->GetModificationTime() < bookfile.GetModificationTime() ||
e2b87f38 545#endif // wxUSE_DATETIME
4f9297b0 546 !LoadCachedBook(bookr, fi->GetStream()))
f35822af
VS
547 {
548 if (fi != NULL) delete fi;
91fa114d
VS
549 fi = fsys.OpenFile(m_tempPath + wxFileNameFromPath(bookfile.GetLocation()) + wxT(".cached"));
550 if (m_tempPath.empty() || fi == NULL ||
e2b87f38 551#if wxUSE_DATETIME
04dbb646 552 fi->GetModificationTime() < bookfile.GetModificationTime() ||
e2b87f38 553#endif // wxUSE_DATETIME
4f9297b0 554 !LoadCachedBook(bookr, fi->GetStream()))
f35822af
VS
555 {
556 LoadMSProject(bookr, fsys, indexfile, contfile);
91fa114d 557 if (!m_tempPath.empty())
f35822af 558 {
91fa114d 559 wxFileOutputStream *outs = new wxFileOutputStream(m_tempPath +
29e60597 560 SafeFileName(wxFileNameFromPath(bookfile.GetLocation())) + wxT(".cached"));
f35822af
VS
561 SaveCachedBook(bookr, outs);
562 delete outs;
563 }
d5bb85a0 564 }
8ec2b484 565 }
04dbb646 566
f35822af 567 if (fi != NULL) delete fi;
8ec2b484
HH
568
569 // Now store the contents range
91fa114d 570 bookr->SetContentsRange(cont_start, m_contents.size());
04dbb646 571
3912b3f8
VS
572 // MS HTML Help files [written by MS HTML Help Workshop] are broken
573 // in that the data are iso-8859-1 (including HTML entities), but must
574 // be interpreted as being in language's windows charset. Correct the
575 // differences here and also convert to wxConvLocal in ANSI build
67c276bd 576 if (encoding != wxFONTENCODING_SYSTEM)
3912b3f8
VS
577 {
578 #if wxUSE_UNICODE
579 #define CORRECT_STR(str, conv) \
580 str = wxString((str).mb_str(wxConvISO8859_1), conv)
581 #else
582 #define CORRECT_STR(str, conv) \
583 str = wxString((str).wc_str(conv), wxConvLocal)
584 #endif
67c276bd 585 wxCSConv conv(encoding);
91fa114d
VS
586 size_t IndexCnt = m_index.size();
587 size_t ContentsCnt = m_contents.size();
588 size_t i;
589 for (i = IndexOld; i < IndexCnt; i++)
f890e2d4 590 {
91fa114d 591 CORRECT_STR(m_index[i].name, conv);
f890e2d4 592 }
91fa114d 593 for (i = ContentsOld; i < ContentsCnt; i++)
3912b3f8 594 {
91fa114d 595 CORRECT_STR(m_contents[i].name, conv);
3912b3f8
VS
596 }
597 #undef CORRECT_STR
f890e2d4 598 }
8ec2b484 599
91fa114d
VS
600 m_bookRecords.Add(bookr);
601 if (!m_index.empty())
602 {
603 m_index.Sort(wxHtmlHelpIndexCompareFunc);
604 }
f42b1601 605
91fa114d 606 return true;
8ec2b484
HH
607}
608
609
610bool wxHtmlHelpData::AddBook(const wxString& book)
611{
3527f29c
VS
612 wxString extension(book.Right(4).Lower());
613 if (extension == wxT(".zip") ||
614#if wxUSE_LIBMSPACK
615 extension == wxT(".chm") /*compressed html help book*/ ||
616#endif
617 extension == wxT(".htb") /*html book*/)
68364659
VS
618 {
619 wxFileSystem fsys;
620 wxString s;
d1da8872 621 bool rt = false;
68364659 622
3527f29c
VS
623#if wxUSE_LIBMSPACK
624 if (extension == wxT(".chm"))
625 s = fsys.FindFirst(book + wxT("#chm:*.hhp"), wxFILE);
626 else
627#endif
628 s = fsys.FindFirst(book + wxT("#zip:*.hhp"), wxFILE);
629
93763ad5 630 while (!s.empty())
68364659 631 {
d1da8872 632 if (AddBook(s)) rt = true;
68364659
VS
633 s = fsys.FindNext();
634 }
04dbb646 635
68364659
VS
636 return rt;
637 }
68364659 638
a509f830
VZ
639 wxFSFile *fi;
640 wxFileSystem fsys;
3dde6c72 641
a509f830
VZ
642 wxString title = _("noname"),
643 safetitle,
644 start = wxEmptyString,
645 contents = wxEmptyString,
646 index = wxEmptyString,
647 charset = wxEmptyString;
68364659 648
a509f830
VZ
649 fi = fsys.OpenFile(book);
650 if (fi == NULL)
651 {
652 wxLogError(_("Cannot open HTML help book: %s"), book.c_str());
d1da8872 653 return false;
68364659 654 }
a509f830
VZ
655 fsys.ChangePathTo(book);
656
657 const wxChar *lineptr;
658 wxChar linebuf[300];
659 wxString tmp;
660 wxHtmlFilterPlainText filter;
661 tmp = filter.ReadFile(*fi);
662 lineptr = tmp.c_str();
663
d1da8872 664 do
a509f830
VZ
665 {
666 lineptr = ReadLine(lineptr, linebuf, 300);
d1da8872 667
a509f830 668 for (wxChar *ch = linebuf; *ch != wxT('\0') && *ch != wxT('='); ch++)
42841dfc 669 *ch = (wxChar)wxTolower(*ch);
a509f830 670
9a83f860
VZ
671 if (wxStrstr(linebuf, wxT("title=")) == linebuf)
672 title = linebuf + wxStrlen(wxT("title="));
673 if (wxStrstr(linebuf, wxT("default topic=")) == linebuf)
674 start = linebuf + wxStrlen(wxT("default topic="));
675 if (wxStrstr(linebuf, wxT("index file=")) == linebuf)
676 index = linebuf + wxStrlen(wxT("index file="));
677 if (wxStrstr(linebuf, wxT("contents file=")) == linebuf)
678 contents = linebuf + wxStrlen(wxT("contents file="));
679 if (wxStrstr(linebuf, wxT("charset=")) == linebuf)
680 charset = linebuf + wxStrlen(wxT("charset="));
a509f830 681 } while (lineptr != NULL);
d1da8872 682
5a969262
RR
683 wxFontEncoding enc = wxFONTENCODING_SYSTEM;
684#if wxUSE_FONTMAP
685 if (charset != wxEmptyString)
686 enc = wxFontMapper::Get()->CharsetToEncoding(charset);
687#endif
a509f830 688
67c276bd 689 bool rtval = AddBookParam(*fi, enc,
a509f830
VZ
690 title, contents, index, start, fsys.GetPath());
691 delete fi;
91fa114d 692
a509f830 693 return rtval;
8ec2b484
HH
694}
695
696wxString wxHtmlHelpData::FindPageByName(const wxString& x)
697{
8ec2b484 698 int i;
8ec2b484 699
8680ee06
RR
700 bool has_non_ascii = false;
701 wxString::const_iterator it;
702 for (it = x.begin(); it != x.end(); ++it)
703 {
704 wxUniChar ch = *it;
705 if (!ch.IsAscii())
706 {
707 has_non_ascii = true;
708 break;
709 }
710 }
03647350 711
8680ee06 712 int cnt = m_bookRecords.GetCount();
03647350 713
8680ee06 714 if (!has_non_ascii)
4f9297b0 715 {
8680ee06
RR
716 wxFileSystem fsys;
717 wxFSFile *f;
718 // 1. try to open given file:
719 for (i = 0; i < cnt; i++)
720 {
91fa114d 721 f = fsys.OpenFile(m_bookRecords[i].GetFullPath(x));
04dbb646
VZ
722 if (f)
723 {
91fa114d 724 wxString url = m_bookRecords[i].GetFullPath(x);
8ec2b484
HH
725 delete f;
726 return url;
727 }
8680ee06 728 }
8ec2b484
HH
729 }
730
731
735a74df 732 // 2. try to find a book:
04dbb646 733 for (i = 0; i < cnt; i++)
4f9297b0 734 {
91fa114d
VS
735 if (m_bookRecords[i].GetTitle() == x)
736 return m_bookRecords[i].GetFullPath(m_bookRecords[i].GetStart());
8ec2b484
HH
737 }
738
735a74df 739 // 3. try to find in contents:
91fa114d 740 cnt = m_contents.size();
04dbb646 741 for (i = 0; i < cnt; i++)
4f9297b0 742 {
91fa114d
VS
743 if (m_contents[i].name == x)
744 return m_contents[i].GetFullPath();
8ec2b484
HH
745 }
746
747
735a74df 748 // 4. try to find in index:
91fa114d 749 cnt = m_index.size();
04dbb646 750 for (i = 0; i < cnt; i++)
4f9297b0 751 {
91fa114d
VS
752 if (m_index[i].name == x)
753 return m_index[i].GetFullPath();
8ec2b484
HH
754 }
755
735a74df
VZ
756 // 4b. if still not found, try case-insensitive comparison
757 for (i = 0; i < cnt; i++)
758 {
759 if (m_index[i].name.CmpNoCase(x) == 0)
760 return m_index[i].GetFullPath();
761 }
762
91fa114d 763 return wxEmptyString;
8ec2b484
HH
764}
765
766wxString wxHtmlHelpData::FindPageById(int id)
f42b1601 767{
91fa114d
VS
768 size_t cnt = m_contents.size();
769 for (size_t i = 0; i < cnt; i++)
4f9297b0 770 {
91fa114d 771 if (m_contents[i].id == id)
04dbb646 772 {
91fa114d 773 return m_contents[i].GetFullPath();
8ec2b484
HH
774 }
775 }
776
91fa114d
VS
777 return wxEmptyString;
778}
779
91fa114d 780
8ec2b484
HH
781//----------------------------------------------------------------------------------
782// wxHtmlSearchStatus functions
783//----------------------------------------------------------------------------------
784
785wxHtmlSearchStatus::wxHtmlSearchStatus(wxHtmlHelpData* data, const wxString& keyword,
c4971147 786 bool case_sensitive, bool whole_words_only,
d5bb85a0 787 const wxString& book)
8ec2b484
HH
788{
789 m_Data = data;
790 m_Keyword = keyword;
791 wxHtmlBookRecord* bookr = NULL;
04dbb646 792 if (book != wxEmptyString)
4f9297b0 793 {
d5bb85a0 794 // we have to search in a specific book. Find it first
91fa114d 795 int i, cnt = data->m_bookRecords.GetCount();
d5bb85a0 796 for (i = 0; i < cnt; i++)
91fa114d 797 if (data->m_bookRecords[i].GetTitle() == book)
04dbb646 798 {
91fa114d 799 bookr = &(data->m_bookRecords[i]);
d5bb85a0
VS
800 m_CurIndex = bookr->GetContentsStart();
801 m_MaxIndex = bookr->GetContentsEnd();
802 break;
803 }
804 // check; we won't crash if the book doesn't exist, but it's Bad Anyway.
805 wxASSERT(bookr);
8ec2b484 806 }
04dbb646 807 if (! bookr)
4f9297b0 808 {
d5bb85a0
VS
809 // no book specified; search all books
810 m_CurIndex = 0;
91fa114d 811 m_MaxIndex = m_Data->m_contents.size();
8ec2b484 812 }
c4971147 813 m_Engine.LookFor(keyword, case_sensitive, whole_words_only);
8ec2b484 814 m_Active = (m_CurIndex < m_MaxIndex);
8ec2b484
HH
815}
816
817bool wxHtmlSearchStatus::Search()
818{
8ec2b484 819 wxFSFile *file;
d5bb85a0 820 int i = m_CurIndex; // shortcut
91fa114d 821 bool found = false;
3912b3f8 822 wxString thepage;
8ec2b484 823
04dbb646 824 if (!m_Active)
4f9297b0 825 {
f35822af 826 // sanity check. Illegal use, but we'll try to prevent a crash anyway
50494a55 827 wxASSERT(m_Active);
91fa114d 828 return false;
8ec2b484
HH
829 }
830
8ec2b484 831 m_Name = wxEmptyString;
91fa114d
VS
832 m_CurItem = NULL;
833 thepage = m_Data->m_contents[i].page;
8ec2b484 834
b5a7b000
VS
835 m_Active = (++m_CurIndex < m_MaxIndex);
836 // check if it is same page with different anchor:
3912b3f8 837 if (!m_LastPage.empty())
b5a7b000 838 {
3912b3f8
VS
839 const wxChar *p1, *p2;
840 for (p1 = thepage.c_str(), p2 = m_LastPage.c_str();
9a83f860 841 *p1 != 0 && *p1 != wxT('#') && *p1 == *p2; p1++, p2++) {}
b5a7b000
VS
842
843 m_LastPage = thepage;
844
9a83f860 845 if (*p1 == 0 || *p1 == wxT('#'))
3912b3f8 846 return false;
b5a7b000
VS
847 }
848 else m_LastPage = thepage;
04dbb646 849
f35822af 850 wxFileSystem fsys;
91fa114d 851 file = fsys.OpenFile(m_Data->m_contents[i].book->GetFullPath(thepage));
04dbb646 852 if (file)
b5a7b000 853 {
2b5f62a0 854 if (m_Engine.Scan(*file))
468ae730 855 {
91fa114d
VS
856 m_Name = m_Data->m_contents[i].name;
857 m_CurItem = &m_Data->m_contents[i];
858 found = true;
d5bb85a0
VS
859 }
860 delete file;
8ec2b484 861 }
8ec2b484
HH
862 return found;
863}
864
d5bb85a0
VS
865
866
867
868
869
870
871
872//--------------------------------------------------------------------------------
2b5f62a0 873// wxHtmlSearchEngine
d5bb85a0
VS
874//--------------------------------------------------------------------------------
875
2b5f62a0 876void wxHtmlSearchEngine::LookFor(const wxString& keyword, bool case_sensitive, bool whole_words_only)
d5bb85a0 877{
c4971147
VS
878 m_CaseSensitive = case_sensitive;
879 m_WholeWords = whole_words_only;
3912b3f8 880 m_Keyword = keyword;
04dbb646 881
3444e4a8 882 if (!m_CaseSensitive)
3912b3f8 883 m_Keyword.LowerCase();
d5bb85a0
VS
884}
885
886
1a1dac18
MB
887static inline bool WHITESPACE(wxChar c)
888{
9a83f860 889 return c == wxT(' ') || c == wxT('\n') || c == wxT('\r') || c == wxT('\t');
1a1dac18 890}
c4971147 891
21dc4638
VZ
892// replace continuous spaces by one single space
893static inline wxString CompressSpaces(const wxString & str)
894{
895 wxString buf;
896 buf.reserve( str.size() );
897
898 bool space_counted = false;
899 for( const wxChar * pstr = str.c_str(); *pstr; ++pstr )
900 {
901 wxChar ch = *pstr;
902 if( WHITESPACE( ch ) )
903 {
904 if( space_counted )
905 {
906 continue;
907 }
9a83f860 908 ch = wxT(' ');
21dc4638
VZ
909 space_counted = true;
910 }
911 else
912 {
913 space_counted = false;
914 }
915 buf += ch;
916 }
917
918 return buf;
919}
920
2b5f62a0 921bool wxHtmlSearchEngine::Scan(const wxFSFile& file)
d5bb85a0 922{
3912b3f8 923 wxASSERT_MSG(!m_Keyword.empty(), wxT("wxHtmlSearchEngine::LookFor must be called before scanning!"));
d5bb85a0 924
2b5f62a0 925 wxHtmlFilterHTML filter;
21dc4638 926 wxString bufStr = filter.ReadFile(file);
d5bb85a0 927
c4971147 928 if (!m_CaseSensitive)
21dc4638 929 bufStr.LowerCase();
d5bb85a0 930
21dc4638
VZ
931 { // remove html tags
932 wxString bufStrCopy;
933 bufStrCopy.reserve( bufStr.size() );
934 bool insideTag = false;
935 for (const wxChar * pBufStr = bufStr.c_str(); *pBufStr; ++pBufStr)
04dbb646 936 {
21dc4638
VZ
937 wxChar c = *pBufStr;
938 if (insideTag)
939 {
9a83f860 940 if (c == wxT('>'))
21dc4638
VZ
941 {
942 insideTag = false;
943 // replace the tag by an empty space
9a83f860 944 c = wxT(' ');
21dc4638
VZ
945 }
946 else
947 continue;
948 }
9a83f860 949 else if (c == wxT('<'))
21dc4638
VZ
950 {
951 wxChar nextCh = *(pBufStr + 1);
9a83f860 952 if (nextCh == wxT('/') || !WHITESPACE(nextCh))
21dc4638
VZ
953 {
954 insideTag = true;
955 continue;
956 }
957 }
958 bufStrCopy += c;
c4971147 959 }
21dc4638 960 bufStr.swap( bufStrCopy );
c4971147 961 }
04dbb646 962
21dc4638
VZ
963 wxString keyword = m_Keyword;
964
965 if (m_WholeWords)
c4971147 966 {
21dc4638 967 // insert ' ' at the beginning and at the end
9a83f860
VZ
968 keyword.insert( 0, wxT(" ") );
969 keyword.append( wxT(" ") );
970 bufStr.insert( 0, wxT(" ") );
971 bufStr.append( wxT(" ") );
d5bb85a0
VS
972 }
973
21dc4638
VZ
974 // remove continuous spaces
975 keyword = CompressSpaces( keyword );
976 bufStr = CompressSpaces( bufStr );
d5bb85a0 977
21dc4638
VZ
978 // finally do the search
979 return bufStr.find( keyword ) != wxString::npos;
980}
d5bb85a0 981
8ec2b484 982#endif