]> git.saurik.com Git - wxWidgets.git/blame - src/html/helpdata.cpp
recognize CP866 (bug 1497808)
[wxWidgets.git] / src / html / helpdata.cpp
CommitLineData
8ec2b484 1/////////////////////////////////////////////////////////////////////////////
93763ad5 2// Name: src/html/helpdata.cpp
8ec2b484 3// Purpose: wxHtmlHelpData
f42b1601 4// Notes: Based on htmlhelp.cpp, implementing a monolithic
8ec2b484
HH
5// HTML Help controller class, by Vaclav Slavik
6// Author: Harm van der Heijden and Vaclav Slavik
69941f05 7// RCS-ID: $Id$
8ec2b484 8// Copyright: (c) Harm van der Heijden and Vaclav Slavik
65571936 9// Licence: wxWindows licence
8ec2b484
HH
10/////////////////////////////////////////////////////////////////////////////
11
8ec2b484
HH
12// For compilers that support precompilation, includes "wx.h".
13#include "wx/wxprec.h"
14
15#ifdef __BORLANDC__
93763ad5 16 #pragma hdrstop
8ec2b484
HH
17#endif
18
f6bcfd97 19#if wxUSE_HTML && wxUSE_STREAMS
8ec2b484
HH
20
21#ifndef WXPRECOMP
04dbb646
VZ
22 #include "wx/intl.h"
23 #include "wx/log.h"
8ec2b484
HH
24#endif
25
401eb3de
RR
26#include <ctype.h>
27
8ec2b484
HH
28#include "wx/html/helpdata.h"
29#include "wx/tokenzr.h"
30#include "wx/wfstream.h"
31#include "wx/busyinfo.h"
f890e2d4
VS
32#include "wx/encconv.h"
33#include "wx/fontmap.h"
69941f05 34#include "wx/html/htmlpars.h"
8ec2b484 35#include "wx/html/htmldefs.h"
2b5f62a0 36#include "wx/html/htmlfilt.h"
057b55b0 37#include "wx/filename.h"
8ec2b484
HH
38
39#include "wx/arrimpl.cpp"
40WX_DEFINE_OBJARRAY(wxHtmlBookRecArray)
91fa114d 41WX_DEFINE_OBJARRAY(wxHtmlHelpDataItems)
8ec2b484
HH
42
43//-----------------------------------------------------------------------------
44// static helper functions
45//-----------------------------------------------------------------------------
46
47// Reads one line, stores it into buf and returns pointer to new line or NULL.
1a1dac18 48static const wxChar* ReadLine(const wxChar *line, wxChar *buf, size_t bufsize)
8ec2b484 49{
1a1dac18
MB
50 wxChar *writeptr = buf;
51 wxChar *endptr = buf + bufsize - 1;
52 const wxChar *readptr = line;
8ec2b484 53
1a1dac18 54 while (*readptr != 0 && *readptr != _T('\r') && *readptr != _T('\n') &&
d1da8872 55 writeptr != endptr)
3dde6c72 56 *(writeptr++) = *(readptr++);
8ec2b484 57 *writeptr = 0;
1a1dac18 58 while (*readptr == _T('\r') || *readptr == _T('\n'))
3dde6c72
VS
59 readptr++;
60 if (*readptr == 0)
61 return NULL;
d1da8872 62 else
3dde6c72 63 return readptr;
8ec2b484
HH
64}
65
66
8ec2b484 67
91fa114d
VS
68static int
69wxHtmlHelpIndexCompareFunc(wxHtmlHelpDataItem **a, wxHtmlHelpDataItem **b)
8ec2b484 70{
91fa114d
VS
71 wxHtmlHelpDataItem *ia = *a;
72 wxHtmlHelpDataItem *ib = *b;
3912b3f8 73
7fbe5489
VS
74 if (ia == NULL)
75 return -1;
76 if (ib == NULL)
77 return 1;
42841dfc 78
91fa114d
VS
79 if (ia->parent == ib->parent)
80 {
81 return ia->name.CmpNoCase(ib->name);
82 }
83 else if (ia->level == ib->level)
84 {
85 return wxHtmlHelpIndexCompareFunc(&ia->parent, &ib->parent);
86 }
87 else
88 {
89 wxHtmlHelpDataItem *ia2 = ia;
90 wxHtmlHelpDataItem *ib2 = ib;
d1da8872 91
91fa114d
VS
92 while (ia2->level > ib2->level)
93 {
94 ia2 = ia2->parent;
95 }
96 while (ib2->level > ia2->level)
97 {
98 ib2 = ib2->parent;
99 }
d1da8872 100
91fa114d
VS
101 wxASSERT(ia2);
102 wxASSERT(ib2);
103 int res = wxHtmlHelpIndexCompareFunc(&ia2, &ib2);
104 if (res != 0)
105 return res;
106 else if (ia->level > ib->level)
107 return 1;
108 else
109 return -1;
110 }
8ec2b484
HH
111}
112
8ec2b484
HH
113//-----------------------------------------------------------------------------
114// HP_Parser
115//-----------------------------------------------------------------------------
116
117class HP_Parser : public wxHtmlParser
118{
211dfedd 119public:
67c276bd
VS
120 HP_Parser()
121 {
122 GetEntitiesParser()->SetEncoding(wxFONTENCODING_ISO8859_1);
123 }
fc7a2a60 124
211dfedd 125 wxObject* GetProduct() { return NULL; }
fc7a2a60 126
211dfedd
VS
127protected:
128 virtual void AddText(const wxChar* WXUNUSED(txt)) {}
fc7a2a60
VZ
129
130 DECLARE_NO_COPY_CLASS(HP_Parser)
8ec2b484
HH
131};
132
133
134//-----------------------------------------------------------------------------
135// HP_TagHandler
136//-----------------------------------------------------------------------------
137
138class HP_TagHandler : public wxHtmlTagHandler
139{
140 private:
91fa114d
VS
141 wxString m_name, m_page;
142 int m_level;
143 int m_id;
144 int m_index;
145 int m_count;
146 wxHtmlHelpDataItem *m_parentItem;
147 wxHtmlBookRecord *m_book;
d1da8872 148
91fa114d 149 wxHtmlHelpDataItems *m_data;
8ec2b484
HH
150
151 public:
04dbb646 152 HP_TagHandler(wxHtmlBookRecord *b) : wxHtmlTagHandler()
91fa114d
VS
153 {
154 m_data = NULL;
155 m_book = b;
156 m_name = m_page = wxEmptyString;
157 m_level = 0;
d1da8872 158 m_id = wxID_ANY;
91fa114d
VS
159 m_count = 0;
160 m_parentItem = NULL;
161 }
66a77a74 162 wxString GetSupportedTags() { return wxT("UL,OBJECT,PARAM"); }
8ec2b484 163 bool HandleTag(const wxHtmlTag& tag);
91fa114d
VS
164
165 void Reset(wxHtmlHelpDataItems& data)
166 {
167 m_data = &data;
168 m_count = 0;
169 m_level = 0;
170 m_parentItem = NULL;
171 }
22f3361e
VZ
172
173 DECLARE_NO_COPY_CLASS(HP_TagHandler)
8ec2b484
HH
174};
175
176
177bool HP_TagHandler::HandleTag(const wxHtmlTag& tag)
178{
04dbb646 179 if (tag.GetName() == wxT("UL"))
4f9297b0 180 {
91fa114d
VS
181 wxHtmlHelpDataItem *oldparent = m_parentItem;
182 m_level++;
183 m_parentItem = (m_count > 0) ? &(*m_data)[m_data->size()-1] : NULL;
8ec2b484 184 ParseInner(tag);
91fa114d
VS
185 m_level--;
186 m_parentItem = oldparent;
187 return true;
8ec2b484 188 }
04dbb646 189 else if (tag.GetName() == wxT("OBJECT"))
4f9297b0 190 {
91fa114d 191 m_name = m_page = wxEmptyString;
8ec2b484 192 ParseInner(tag);
50494a55 193
daa084c2 194#if 0
91fa114d 195 if (!page.IsEmpty())
7df9fbc3 196 /* Valid HHW's file may contain only two object tags:
04dbb646 197
4157f43f
VS
198 <OBJECT type="text/site properties">
199 <param name="ImageType" value="Folder">
200 </OBJECT>
04dbb646 201
4157f43f 202 or
04dbb646
VZ
203
204 <OBJECT type="text/sitemap">
205 <param name="Name" value="main page">
206 <param name="Local" value="another.htm">
207 </OBJECT>
208
91fa114d 209 We're interested in the latter. !page.IsEmpty() is valid
4157f43f
VS
210 condition because text/site properties does not contain Local param
211 */
daa084c2
VS
212#endif
213 if (tag.GetParam(wxT("TYPE")) == wxT("text/sitemap"))
4157f43f 214 {
91fa114d
VS
215 wxHtmlHelpDataItem *item = new wxHtmlHelpDataItem();
216 item->parent = m_parentItem;
217 item->level = m_level;
218 item->id = m_id;
219 item->page = m_page;
220 item->name = m_name;
d1da8872 221
91fa114d
VS
222 item->book = m_book;
223 m_data->Add(item);
224 m_count++;
4157f43f 225 }
50494a55 226
91fa114d 227 return true;
8ec2b484 228 }
04dbb646 229 else
4f9297b0 230 { // "PARAM"
91fa114d
VS
231 if (m_name.empty() && tag.GetParam(wxT("NAME")) == wxT("Name"))
232 m_name = tag.GetParam(wxT("VALUE"));
04dbb646 233 if (tag.GetParam(wxT("NAME")) == wxT("Local"))
91fa114d 234 m_page = tag.GetParam(wxT("VALUE"));
04dbb646 235 if (tag.GetParam(wxT("NAME")) == wxT("ID"))
91fa114d
VS
236 tag.GetParamAsInt(wxT("VALUE"), &m_id);
237 return false;
8ec2b484
HH
238 }
239}
240
241
8ec2b484
HH
242//-----------------------------------------------------------------------------
243// wxHtmlHelpData
244//-----------------------------------------------------------------------------
245
468ae730
VS
246wxString wxHtmlBookRecord::GetFullPath(const wxString &page) const
247{
248 if (wxIsAbsolutePath(page))
249 return page;
250 else
251 return m_BasePath + page;
252}
253
91fa114d
VS
254wxString wxHtmlHelpDataItem::GetIndentedName() const
255{
256 wxString s;
257 for (int i = 1; i < level; i++)
258 s << _T(" ");
259 s << name;
260 return s;
261}
468ae730
VS
262
263
8ec2b484
HH
264IMPLEMENT_DYNAMIC_CLASS(wxHtmlHelpData, wxObject)
265
f42b1601 266wxHtmlHelpData::wxHtmlHelpData()
8ec2b484 267{
91fa114d
VS
268#if WXWIN_COMPATIBILITY_2_4
269 m_cacheContents = NULL;
270 m_cacheIndex = NULL;
271#endif
8ec2b484
HH
272}
273
274wxHtmlHelpData::~wxHtmlHelpData()
275{
91fa114d
VS
276#if WXWIN_COMPATIBILITY_2_4
277 CleanCompatibilityData();
278#endif
8ec2b484
HH
279}
280
67c276bd
VS
281bool wxHtmlHelpData::LoadMSProject(wxHtmlBookRecord *book, wxFileSystem& fsys,
282 const wxString& indexfile,
283 const wxString& contentsfile)
8ec2b484
HH
284{
285 wxFSFile *f;
2b5f62a0 286 wxHtmlFilterHTML filter;
eb37e1d2 287 wxString buf;
8ec2b484 288 wxString string;
f42b1601 289
8ec2b484
HH
290 HP_Parser parser;
291 HP_TagHandler *handler = new HP_TagHandler(book);
292 parser.AddTagHandler(handler);
293
93763ad5 294 f = ( contentsfile.empty() ? (wxFSFile*) NULL : fsys.OpenFile(contentsfile) );
04dbb646 295 if (f)
4f9297b0 296 {
eb37e1d2 297 buf.clear();
2b5f62a0 298 buf = filter.ReadFile(*f);
8ec2b484 299 delete f;
91fa114d 300 handler->Reset(m_contents);
8ec2b484 301 parser.Parse(buf);
8ec2b484 302 }
f3c82859 303 else
2b5f62a0 304 {
f6bcfd97 305 wxLogError(_("Cannot open contents file: %s"), contentsfile.c_str());
2b5f62a0 306 }
8ec2b484 307
93763ad5 308 f = ( indexfile.empty() ? (wxFSFile*) NULL : fsys.OpenFile(indexfile) );
04dbb646 309 if (f)
4f9297b0 310 {
eb37e1d2 311 buf.clear();
2b5f62a0 312 buf = filter.ReadFile(*f);
8ec2b484 313 delete f;
91fa114d 314 handler->Reset(m_index);
8ec2b484 315 parser.Parse(buf);
8ec2b484 316 }
93763ad5 317 else if (!indexfile.empty())
2b5f62a0 318 {
f6bcfd97 319 wxLogError(_("Cannot open index file: %s"), indexfile.c_str());
2b5f62a0 320 }
d1da8872 321 return true;
8ec2b484
HH
322}
323
4fd5055c
VS
324inline static void CacheWriteInt32(wxOutputStream *f, wxInt32 value)
325{
326 wxInt32 x = wxINT32_SWAP_ON_BE(value);
327 f->Write(&x, sizeof(x));
328}
f35822af 329
4fd5055c
VS
330inline static wxInt32 CacheReadInt32(wxInputStream *f)
331{
332 wxInt32 x;
333 f->Read(&x, sizeof(x));
334 return wxINT32_SWAP_ON_BE(x);
335}
f35822af 336
3912b3f8 337inline static void CacheWriteString(wxOutputStream *f, const wxString& str)
d1da8872 338{
3912b3f8
VS
339 const wxWX2MBbuf mbstr = str.mb_str(wxConvUTF8);
340 size_t len = strlen((const char*)mbstr)+1;
4fd5055c 341 CacheWriteInt32(f, len);
3912b3f8 342 f->Write((const char*)mbstr, len);
4fd5055c 343}
f35822af 344
3912b3f8 345inline static wxString CacheReadString(wxInputStream *f)
4fd5055c 346{
4fd5055c 347 size_t len = (size_t)CacheReadInt32(f);
3912b3f8
VS
348 wxCharBuffer str(len-1);
349 f->Read(str.data(), len);
350 return wxString(str, wxConvUTF8);
4fd5055c 351}
f35822af 352
91fa114d 353#define CURRENT_CACHED_BOOK_VERSION 5
d1a9c82b
VS
354
355// Additional flags to detect incompatibilities of the runtime environment:
356#define CACHED_BOOK_FORMAT_FLAGS \
357 (wxUSE_UNICODE << 0)
358
f35822af 359
8ec2b484
HH
360bool wxHtmlHelpData::LoadCachedBook(wxHtmlBookRecord *book, wxInputStream *f)
361{
91fa114d 362 int i, st, newsize;
f35822af
VS
363 wxInt32 version;
364
365 /* load header - version info : */
4fd5055c 366 version = CacheReadInt32(f);
d1da8872 367
04dbb646 368 if (version != CURRENT_CACHED_BOOK_VERSION)
f3c82859 369 {
d1da8872 370 // NB: We can just silently return false here and don't worry about
4fd5055c 371 // it anymore, because AddBookParam will load the MS project in
d1da8872 372 // absence of (properly versioned) .cached file and automatically
4fd5055c 373 // create new .cached file immediately afterward.
91fa114d 374 return false;
f3c82859 375 }
04dbb646 376
d1a9c82b 377 if (CacheReadInt32(f) != CACHED_BOOK_FORMAT_FLAGS)
91fa114d 378 return false;
d1a9c82b 379
8ec2b484 380 /* load contents : */
91fa114d
VS
381 st = m_contents.size();
382 newsize = st + CacheReadInt32(f);
383 m_contents.Alloc(newsize);
384 for (i = st; i < newsize; i++)
4f9297b0 385 {
91fa114d
VS
386 wxHtmlHelpDataItem *item = new wxHtmlHelpDataItem;
387 item->level = CacheReadInt32(f);
388 item->id = CacheReadInt32(f);
389 item->name = CacheReadString(f);
390 item->page = CacheReadString(f);
391 item->book = book;
392 m_contents.Add(item);
8ec2b484
HH
393 }
394
395 /* load index : */
91fa114d
VS
396 st = m_index.size();
397 newsize = st + CacheReadInt32(f);
398 m_index.Alloc(newsize);
399 for (i = st; i < newsize; i++)
4f9297b0 400 {
91fa114d
VS
401 wxHtmlHelpDataItem *item = new wxHtmlHelpDataItem;
402 item->name = CacheReadString(f);
403 item->page = CacheReadString(f);
404 item->level = CacheReadInt32(f);
405 item->book = book;
406 int parentShift = CacheReadInt32(f);
407 if (parentShift != 0)
408 item->parent = &m_index[m_index.size() - parentShift];
409 m_index.Add(item);
8ec2b484 410 }
91fa114d 411 return true;
8ec2b484
HH
412}
413
414
415bool wxHtmlHelpData::SaveCachedBook(wxHtmlBookRecord *book, wxOutputStream *f)
416{
417 int i;
4fd5055c 418 wxInt32 cnt;
f35822af
VS
419
420 /* save header - version info : */
4fd5055c 421 CacheWriteInt32(f, CURRENT_CACHED_BOOK_VERSION);
d1a9c82b 422 CacheWriteInt32(f, CACHED_BOOK_FORMAT_FLAGS);
8ec2b484
HH
423
424 /* save contents : */
91fa114d 425 int len = m_contents.size();
d1da8872 426 for (cnt = 0, i = 0; i < len; i++)
91fa114d 427 if (m_contents[i].book == book && m_contents[i].level > 0)
4fd5055c
VS
428 cnt++;
429 CacheWriteInt32(f, cnt);
8ec2b484 430
91fa114d 431 for (i = 0; i < len; i++)
4f9297b0 432 {
d1da8872 433 if (m_contents[i].book != book || m_contents[i].level == 0)
4fd5055c 434 continue;
91fa114d
VS
435 CacheWriteInt32(f, m_contents[i].level);
436 CacheWriteInt32(f, m_contents[i].id);
437 CacheWriteString(f, m_contents[i].name);
438 CacheWriteString(f, m_contents[i].page);
8ec2b484
HH
439 }
440
441 /* save index : */
91fa114d 442 len = m_index.size();
d1da8872
WS
443 for (cnt = 0, i = 0; i < len; i++)
444 if (m_index[i].book == book && m_index[i].level > 0)
4fd5055c
VS
445 cnt++;
446 CacheWriteInt32(f, cnt);
8ec2b484 447
91fa114d 448 for (i = 0; i < len; i++)
4f9297b0 449 {
d1da8872 450 if (m_index[i].book != book || m_index[i].level == 0)
4fd5055c 451 continue;
91fa114d
VS
452 CacheWriteString(f, m_index[i].name);
453 CacheWriteString(f, m_index[i].page);
454 CacheWriteInt32(f, m_index[i].level);
455 // save distance to parent item, if any:
456 if (m_index[i].parent == NULL)
457 {
458 CacheWriteInt32(f, 0);
459 }
460 else
461 {
17a1ebd1 462 int cnt2 = 0;
91fa114d
VS
463 wxHtmlHelpDataItem *parent = m_index[i].parent;
464 for (int j = i-1; j >= 0; j--)
465 {
466 if (m_index[j].book == book && m_index[j].level > 0)
17a1ebd1 467 cnt2++;
91fa114d
VS
468 if (&m_index[j] == parent)
469 break;
470 }
17a1ebd1
VZ
471 wxASSERT(cnt2 > 0);
472 CacheWriteInt32(f, cnt2);
91fa114d 473 }
8ec2b484 474 }
91fa114d 475 return true;
8ec2b484
HH
476}
477
478
479void wxHtmlHelpData::SetTempDir(const wxString& path)
480{
91fa114d
VS
481 if (path.empty())
482 m_tempPath = path;
04dbb646 483 else
4f9297b0 484 {
91fa114d
VS
485 if (wxIsAbsolutePath(path)) m_tempPath = path;
486 else m_tempPath = wxGetCwd() + _T("/") + path;
8ec2b484 487
93763ad5 488 if (m_tempPath[m_tempPath.length() - 1] != _T('/'))
91fa114d 489 m_tempPath << _T('/');
8ec2b484
HH
490 }
491}
492
493
29e60597
VS
494
495static wxString SafeFileName(const wxString& s)
496{
497 wxString res(s);
498 res.Replace(wxT("#"), wxT("_"));
499 res.Replace(wxT(":"), wxT("_"));
500 res.Replace(wxT("\\"), wxT("_"));
501 res.Replace(wxT("/"), wxT("_"));
502 return res;
503}
504
f35822af 505bool wxHtmlHelpData::AddBookParam(const wxFSFile& bookfile,
f890e2d4 506 wxFontEncoding encoding,
f35822af 507 const wxString& title, const wxString& contfile,
d5bb85a0
VS
508 const wxString& indexfile, const wxString& deftopic,
509 const wxString& path)
8ec2b484
HH
510{
511 wxFileSystem fsys;
512 wxFSFile *fi;
513 wxHtmlBookRecord *bookr;
04dbb646 514
91fa114d
VS
515 int IndexOld = m_index.size(),
516 ContentsOld = m_contents.size();
f42b1601 517
93763ad5 518 if (!path.empty())
d1da8872 519 fsys.ChangePathTo(path, true);
8ec2b484 520
91fa114d 521 size_t booksCnt = m_bookRecords.GetCount();
5ecdcaa7
VS
522 for (size_t i = 0; i < booksCnt; i++)
523 {
91fa114d
VS
524 if ( m_bookRecords[i].GetBookFile() == bookfile.GetLocation() )
525 return true; // book is (was) loaded
5ecdcaa7
VS
526 }
527
528 bookr = new wxHtmlBookRecord(bookfile.GetLocation(), fsys.GetPath(), title, deftopic);
d1da8872 529
91fa114d
VS
530 wxHtmlHelpDataItem *bookitem = new wxHtmlHelpDataItem;
531 bookitem->level = 0;
532 bookitem->id = 0;
533 bookitem->page = deftopic;
534 bookitem->name = title;
535 bookitem->book = bookr;
8ec2b484
HH
536
537 // store the contents index for later
91fa114d
VS
538 int cont_start = m_contents.size();
539
540 m_contents.Add(bookitem);
8ec2b484
HH
541
542 // Try to find cached binary versions:
f35822af
VS
543 // 1. save file as book, but with .hhp.cached extension
544 // 2. same as 1. but in temp path
545 // 3. otherwise or if cache load failed, load it from MS.
04dbb646 546
f35822af 547 fi = fsys.OpenFile(bookfile.GetLocation() + wxT(".cached"));
04dbb646
VZ
548
549 if (fi == NULL ||
e2b87f38 550#if wxUSE_DATETIME
04dbb646 551 fi->GetModificationTime() < bookfile.GetModificationTime() ||
e2b87f38 552#endif // wxUSE_DATETIME
4f9297b0 553 !LoadCachedBook(bookr, fi->GetStream()))
f35822af
VS
554 {
555 if (fi != NULL) delete fi;
91fa114d
VS
556 fi = fsys.OpenFile(m_tempPath + wxFileNameFromPath(bookfile.GetLocation()) + wxT(".cached"));
557 if (m_tempPath.empty() || fi == NULL ||
e2b87f38 558#if wxUSE_DATETIME
04dbb646 559 fi->GetModificationTime() < bookfile.GetModificationTime() ||
e2b87f38 560#endif // wxUSE_DATETIME
4f9297b0 561 !LoadCachedBook(bookr, fi->GetStream()))
f35822af
VS
562 {
563 LoadMSProject(bookr, fsys, indexfile, contfile);
91fa114d 564 if (!m_tempPath.empty())
f35822af 565 {
91fa114d 566 wxFileOutputStream *outs = new wxFileOutputStream(m_tempPath +
29e60597 567 SafeFileName(wxFileNameFromPath(bookfile.GetLocation())) + wxT(".cached"));
f35822af
VS
568 SaveCachedBook(bookr, outs);
569 delete outs;
570 }
d5bb85a0 571 }
8ec2b484 572 }
04dbb646 573
f35822af 574 if (fi != NULL) delete fi;
8ec2b484
HH
575
576 // Now store the contents range
91fa114d 577 bookr->SetContentsRange(cont_start, m_contents.size());
04dbb646 578
3912b3f8
VS
579#if wxUSE_WCHAR_T
580 // MS HTML Help files [written by MS HTML Help Workshop] are broken
581 // in that the data are iso-8859-1 (including HTML entities), but must
582 // be interpreted as being in language's windows charset. Correct the
583 // differences here and also convert to wxConvLocal in ANSI build
67c276bd 584 if (encoding != wxFONTENCODING_SYSTEM)
3912b3f8
VS
585 {
586 #if wxUSE_UNICODE
587 #define CORRECT_STR(str, conv) \
588 str = wxString((str).mb_str(wxConvISO8859_1), conv)
589 #else
590 #define CORRECT_STR(str, conv) \
591 str = wxString((str).wc_str(conv), wxConvLocal)
592 #endif
67c276bd 593 wxCSConv conv(encoding);
91fa114d
VS
594 size_t IndexCnt = m_index.size();
595 size_t ContentsCnt = m_contents.size();
596 size_t i;
597 for (i = IndexOld; i < IndexCnt; i++)
f890e2d4 598 {
91fa114d 599 CORRECT_STR(m_index[i].name, conv);
f890e2d4 600 }
91fa114d 601 for (i = ContentsOld; i < ContentsCnt; i++)
3912b3f8 602 {
91fa114d 603 CORRECT_STR(m_contents[i].name, conv);
3912b3f8
VS
604 }
605 #undef CORRECT_STR
f890e2d4 606 }
0b4f47a3
DS
607#else
608 wxUnusedVar(IndexOld);
609 wxUnusedVar(ContentsOld);
67c276bd 610 wxASSERT_MSG(encoding == wxFONTENCODING_SYSTEM, wxT("Help files need charset conversion, but wxUSE_WCHAR_T is 0"));
3912b3f8 611#endif // wxUSE_WCHAR_T/!wxUSE_WCHAR_T
8ec2b484 612
91fa114d
VS
613 m_bookRecords.Add(bookr);
614 if (!m_index.empty())
615 {
616 m_index.Sort(wxHtmlHelpIndexCompareFunc);
617 }
f42b1601 618
91fa114d 619 return true;
8ec2b484
HH
620}
621
622
623bool wxHtmlHelpData::AddBook(const wxString& book)
624{
3527f29c
VS
625 wxString extension(book.Right(4).Lower());
626 if (extension == wxT(".zip") ||
627#if wxUSE_LIBMSPACK
628 extension == wxT(".chm") /*compressed html help book*/ ||
629#endif
630 extension == wxT(".htb") /*html book*/)
68364659
VS
631 {
632 wxFileSystem fsys;
633 wxString s;
d1da8872 634 bool rt = false;
68364659 635
3527f29c
VS
636#if wxUSE_LIBMSPACK
637 if (extension == wxT(".chm"))
638 s = fsys.FindFirst(book + wxT("#chm:*.hhp"), wxFILE);
639 else
640#endif
641 s = fsys.FindFirst(book + wxT("#zip:*.hhp"), wxFILE);
642
93763ad5 643 while (!s.empty())
68364659 644 {
d1da8872 645 if (AddBook(s)) rt = true;
68364659
VS
646 s = fsys.FindNext();
647 }
04dbb646 648
68364659
VS
649 return rt;
650 }
68364659 651
a509f830
VZ
652 wxFSFile *fi;
653 wxFileSystem fsys;
3dde6c72 654
a509f830
VZ
655 wxString title = _("noname"),
656 safetitle,
657 start = wxEmptyString,
658 contents = wxEmptyString,
659 index = wxEmptyString,
660 charset = wxEmptyString;
68364659 661
a509f830
VZ
662 fi = fsys.OpenFile(book);
663 if (fi == NULL)
664 {
665 wxLogError(_("Cannot open HTML help book: %s"), book.c_str());
d1da8872 666 return false;
68364659 667 }
a509f830
VZ
668 fsys.ChangePathTo(book);
669
670 const wxChar *lineptr;
671 wxChar linebuf[300];
672 wxString tmp;
673 wxHtmlFilterPlainText filter;
674 tmp = filter.ReadFile(*fi);
675 lineptr = tmp.c_str();
676
d1da8872 677 do
a509f830
VZ
678 {
679 lineptr = ReadLine(lineptr, linebuf, 300);
d1da8872 680
a509f830 681 for (wxChar *ch = linebuf; *ch != wxT('\0') && *ch != wxT('='); ch++)
42841dfc 682 *ch = (wxChar)wxTolower(*ch);
a509f830
VZ
683
684 if (wxStrstr(linebuf, _T("title=")) == linebuf)
685 title = linebuf + wxStrlen(_T("title="));
686 if (wxStrstr(linebuf, _T("default topic=")) == linebuf)
687 start = linebuf + wxStrlen(_T("default topic="));
688 if (wxStrstr(linebuf, _T("index file=")) == linebuf)
689 index = linebuf + wxStrlen(_T("index file="));
690 if (wxStrstr(linebuf, _T("contents file=")) == linebuf)
691 contents = linebuf + wxStrlen(_T("contents file="));
692 if (wxStrstr(linebuf, _T("charset=")) == linebuf)
693 charset = linebuf + wxStrlen(_T("charset="));
694 } while (lineptr != NULL);
d1da8872 695
5a969262
RR
696 wxFontEncoding enc = wxFONTENCODING_SYSTEM;
697#if wxUSE_FONTMAP
698 if (charset != wxEmptyString)
699 enc = wxFontMapper::Get()->CharsetToEncoding(charset);
700#endif
a509f830 701
67c276bd 702 bool rtval = AddBookParam(*fi, enc,
a509f830
VZ
703 title, contents, index, start, fsys.GetPath());
704 delete fi;
91fa114d
VS
705
706#if WXWIN_COMPATIBILITY_2_4
707 CleanCompatibilityData();
708#endif
709
a509f830 710 return rtval;
8ec2b484
HH
711}
712
713wxString wxHtmlHelpData::FindPageByName(const wxString& x)
714{
715 int cnt;
716 int i;
717 wxFileSystem fsys;
718 wxFSFile *f;
8ec2b484 719
735a74df 720 // 1. try to open given file:
91fa114d 721 cnt = m_bookRecords.GetCount();
04dbb646 722 for (i = 0; i < cnt; i++)
4f9297b0 723 {
91fa114d 724 f = fsys.OpenFile(m_bookRecords[i].GetFullPath(x));
04dbb646
VZ
725 if (f)
726 {
91fa114d 727 wxString url = m_bookRecords[i].GetFullPath(x);
8ec2b484
HH
728 delete f;
729 return url;
730 }
731 }
732
733
735a74df 734 // 2. try to find a book:
04dbb646 735 for (i = 0; i < cnt; i++)
4f9297b0 736 {
91fa114d
VS
737 if (m_bookRecords[i].GetTitle() == x)
738 return m_bookRecords[i].GetFullPath(m_bookRecords[i].GetStart());
8ec2b484
HH
739 }
740
735a74df 741 // 3. try to find in contents:
91fa114d 742 cnt = m_contents.size();
04dbb646 743 for (i = 0; i < cnt; i++)
4f9297b0 744 {
91fa114d
VS
745 if (m_contents[i].name == x)
746 return m_contents[i].GetFullPath();
8ec2b484
HH
747 }
748
749
735a74df 750 // 4. try to find in index:
91fa114d 751 cnt = m_index.size();
04dbb646 752 for (i = 0; i < cnt; i++)
4f9297b0 753 {
91fa114d
VS
754 if (m_index[i].name == x)
755 return m_index[i].GetFullPath();
8ec2b484
HH
756 }
757
735a74df
VZ
758 // 4b. if still not found, try case-insensitive comparison
759 for (i = 0; i < cnt; i++)
760 {
761 if (m_index[i].name.CmpNoCase(x) == 0)
762 return m_index[i].GetFullPath();
763 }
764
91fa114d 765 return wxEmptyString;
8ec2b484
HH
766}
767
768wxString wxHtmlHelpData::FindPageById(int id)
f42b1601 769{
91fa114d
VS
770 size_t cnt = m_contents.size();
771 for (size_t i = 0; i < cnt; i++)
4f9297b0 772 {
91fa114d 773 if (m_contents[i].id == id)
04dbb646 774 {
91fa114d 775 return m_contents[i].GetFullPath();
8ec2b484
HH
776 }
777 }
778
91fa114d
VS
779 return wxEmptyString;
780}
781
782#if WXWIN_COMPATIBILITY_2_4
783wxHtmlContentsItem::wxHtmlContentsItem()
d1da8872 784 : m_Level(0), m_ID(wxID_ANY), m_Name(NULL), m_Page(NULL), m_Book(NULL),
91fa114d
VS
785 m_autofree(false)
786{
787}
788
789wxHtmlContentsItem::wxHtmlContentsItem(const wxHtmlHelpDataItem& d)
790{
791 m_autofree = true;
792 m_Level = d.level;
793 m_ID = d.id;
794 m_Name = wxStrdup(d.name.c_str());
795 m_Page = wxStrdup(d.page.c_str());
796 m_Book = d.book;
797}
798
799wxHtmlContentsItem& wxHtmlContentsItem::operator=(const wxHtmlContentsItem& d)
800{
801 if (m_autofree)
802 {
803 free(m_Name);
804 free(m_Page);
805 }
806 m_autofree = true;
807 m_Level = d.m_Level;
808 m_ID = d.m_ID;
809 m_Name = d.m_Name ? wxStrdup(d.m_Name) : NULL;
810 m_Page = d.m_Page ? wxStrdup(d.m_Page) : NULL;
811 m_Book = d.m_Book;
812 return *this;
8ec2b484
HH
813}
814
91fa114d
VS
815wxHtmlContentsItem::~wxHtmlContentsItem()
816{
817 if (m_autofree)
818 {
819 free(m_Name);
820 free(m_Page);
821 }
822}
823
824wxHtmlContentsItem* wxHtmlHelpData::GetContents()
825{
826 if (!m_cacheContents && !m_contents.empty())
827 {
828 size_t len = m_contents.size();
829 m_cacheContents = new wxHtmlContentsItem[len];
830 for (size_t i = 0; i < len; i++)
831 m_cacheContents[i] = m_contents[i];
832 }
833 return m_cacheContents;
834}
835
836int wxHtmlHelpData::GetContentsCnt()
837{
838 return m_contents.size();
839}
840
841wxHtmlContentsItem* wxHtmlHelpData::GetIndex()
842{
843 if (!m_cacheContents && !m_index.empty())
844 {
845 size_t len = m_index.size();
846 m_cacheContents = new wxHtmlContentsItem[len];
847 for (size_t i = 0; i < len; i++)
848 m_cacheContents[i] = m_index[i];
849 }
850 return m_cacheContents;
851}
852
853int wxHtmlHelpData::GetIndexCnt()
854{
855 return m_index.size();
856}
857
858void wxHtmlHelpData::CleanCompatibilityData()
859{
860 delete[] m_cacheContents;
861 m_cacheContents = NULL;
862 delete[] m_cacheIndex;
863 m_cacheIndex = NULL;
864}
865#endif // WXWIN_COMPATIBILITY_2_4
866
8ec2b484
HH
867//----------------------------------------------------------------------------------
868// wxHtmlSearchStatus functions
869//----------------------------------------------------------------------------------
870
871wxHtmlSearchStatus::wxHtmlSearchStatus(wxHtmlHelpData* data, const wxString& keyword,
c4971147 872 bool case_sensitive, bool whole_words_only,
d5bb85a0 873 const wxString& book)
8ec2b484
HH
874{
875 m_Data = data;
876 m_Keyword = keyword;
877 wxHtmlBookRecord* bookr = NULL;
04dbb646 878 if (book != wxEmptyString)
4f9297b0 879 {
d5bb85a0 880 // we have to search in a specific book. Find it first
91fa114d 881 int i, cnt = data->m_bookRecords.GetCount();
d5bb85a0 882 for (i = 0; i < cnt; i++)
91fa114d 883 if (data->m_bookRecords[i].GetTitle() == book)
04dbb646 884 {
91fa114d 885 bookr = &(data->m_bookRecords[i]);
d5bb85a0
VS
886 m_CurIndex = bookr->GetContentsStart();
887 m_MaxIndex = bookr->GetContentsEnd();
888 break;
889 }
890 // check; we won't crash if the book doesn't exist, but it's Bad Anyway.
891 wxASSERT(bookr);
8ec2b484 892 }
04dbb646 893 if (! bookr)
4f9297b0 894 {
d5bb85a0
VS
895 // no book specified; search all books
896 m_CurIndex = 0;
91fa114d 897 m_MaxIndex = m_Data->m_contents.size();
8ec2b484 898 }
c4971147 899 m_Engine.LookFor(keyword, case_sensitive, whole_words_only);
8ec2b484 900 m_Active = (m_CurIndex < m_MaxIndex);
8ec2b484
HH
901}
902
91fa114d
VS
903#if WXWIN_COMPATIBILITY_2_4
904wxHtmlContentsItem* wxHtmlSearchStatus::GetContentsItem()
905{
906 static wxHtmlContentsItem it;
907 it = wxHtmlContentsItem(*m_CurItem);
908 return &it;
909}
910#endif
911
8ec2b484
HH
912bool wxHtmlSearchStatus::Search()
913{
8ec2b484 914 wxFSFile *file;
d5bb85a0 915 int i = m_CurIndex; // shortcut
91fa114d 916 bool found = false;
3912b3f8 917 wxString thepage;
8ec2b484 918
04dbb646 919 if (!m_Active)
4f9297b0 920 {
f35822af 921 // sanity check. Illegal use, but we'll try to prevent a crash anyway
50494a55 922 wxASSERT(m_Active);
91fa114d 923 return false;
8ec2b484
HH
924 }
925
8ec2b484 926 m_Name = wxEmptyString;
91fa114d
VS
927 m_CurItem = NULL;
928 thepage = m_Data->m_contents[i].page;
8ec2b484 929
b5a7b000
VS
930 m_Active = (++m_CurIndex < m_MaxIndex);
931 // check if it is same page with different anchor:
3912b3f8 932 if (!m_LastPage.empty())
b5a7b000 933 {
3912b3f8
VS
934 const wxChar *p1, *p2;
935 for (p1 = thepage.c_str(), p2 = m_LastPage.c_str();
b5a7b000
VS
936 *p1 != 0 && *p1 != _T('#') && *p1 == *p2; p1++, p2++) {}
937
938 m_LastPage = thepage;
939
940 if (*p1 == 0 || *p1 == _T('#'))
3912b3f8 941 return false;
b5a7b000
VS
942 }
943 else m_LastPage = thepage;
04dbb646 944
f35822af 945 wxFileSystem fsys;
91fa114d 946 file = fsys.OpenFile(m_Data->m_contents[i].book->GetFullPath(thepage));
04dbb646 947 if (file)
b5a7b000 948 {
2b5f62a0 949 if (m_Engine.Scan(*file))
468ae730 950 {
91fa114d
VS
951 m_Name = m_Data->m_contents[i].name;
952 m_CurItem = &m_Data->m_contents[i];
953 found = true;
d5bb85a0
VS
954 }
955 delete file;
8ec2b484 956 }
8ec2b484
HH
957 return found;
958}
959
d5bb85a0
VS
960
961
962
963
964
965
966
967//--------------------------------------------------------------------------------
2b5f62a0 968// wxHtmlSearchEngine
d5bb85a0
VS
969//--------------------------------------------------------------------------------
970
2b5f62a0 971void wxHtmlSearchEngine::LookFor(const wxString& keyword, bool case_sensitive, bool whole_words_only)
d5bb85a0 972{
c4971147
VS
973 m_CaseSensitive = case_sensitive;
974 m_WholeWords = whole_words_only;
3912b3f8 975 m_Keyword = keyword;
04dbb646 976
3444e4a8 977 if (!m_CaseSensitive)
3912b3f8 978 m_Keyword.LowerCase();
d5bb85a0
VS
979}
980
981
1a1dac18
MB
982static inline bool WHITESPACE(wxChar c)
983{
984 return c == _T(' ') || c == _T('\n') || c == _T('\r') || c == _T('\t');
985}
c4971147 986
21dc4638
VZ
987// replace continuous spaces by one single space
988static inline wxString CompressSpaces(const wxString & str)
989{
990 wxString buf;
991 buf.reserve( str.size() );
992
993 bool space_counted = false;
994 for( const wxChar * pstr = str.c_str(); *pstr; ++pstr )
995 {
996 wxChar ch = *pstr;
997 if( WHITESPACE( ch ) )
998 {
999 if( space_counted )
1000 {
1001 continue;
1002 }
1003 ch = _T(' ');
1004 space_counted = true;
1005 }
1006 else
1007 {
1008 space_counted = false;
1009 }
1010 buf += ch;
1011 }
1012
1013 return buf;
1014}
1015
2b5f62a0 1016bool wxHtmlSearchEngine::Scan(const wxFSFile& file)
d5bb85a0 1017{
3912b3f8 1018 wxASSERT_MSG(!m_Keyword.empty(), wxT("wxHtmlSearchEngine::LookFor must be called before scanning!"));
d5bb85a0 1019
2b5f62a0 1020 wxHtmlFilterHTML filter;
21dc4638 1021 wxString bufStr = filter.ReadFile(file);
d5bb85a0 1022
c4971147 1023 if (!m_CaseSensitive)
21dc4638 1024 bufStr.LowerCase();
d5bb85a0 1025
21dc4638
VZ
1026 { // remove html tags
1027 wxString bufStrCopy;
1028 bufStrCopy.reserve( bufStr.size() );
1029 bool insideTag = false;
1030 for (const wxChar * pBufStr = bufStr.c_str(); *pBufStr; ++pBufStr)
04dbb646 1031 {
21dc4638
VZ
1032 wxChar c = *pBufStr;
1033 if (insideTag)
1034 {
1035 if (c == _T('>'))
1036 {
1037 insideTag = false;
1038 // replace the tag by an empty space
1039 c = _T(' ');
1040 }
1041 else
1042 continue;
1043 }
1044 else if (c == _T('<'))
1045 {
1046 wxChar nextCh = *(pBufStr + 1);
1047 if (nextCh == _T('/') || !WHITESPACE(nextCh))
1048 {
1049 insideTag = true;
1050 continue;
1051 }
1052 }
1053 bufStrCopy += c;
c4971147 1054 }
21dc4638 1055 bufStr.swap( bufStrCopy );
c4971147 1056 }
04dbb646 1057
21dc4638
VZ
1058 wxString keyword = m_Keyword;
1059
1060 if (m_WholeWords)
c4971147 1061 {
21dc4638
VZ
1062 // insert ' ' at the beginning and at the end
1063 keyword.insert( 0, _T(" ") );
1064 keyword.append( _T(" ") );
1065 bufStr.insert( 0, _T(" ") );
1066 bufStr.append( _T(" ") );
d5bb85a0
VS
1067 }
1068
21dc4638
VZ
1069 // remove continuous spaces
1070 keyword = CompressSpaces( keyword );
1071 bufStr = CompressSpaces( bufStr );
d5bb85a0 1072
21dc4638
VZ
1073 // finally do the search
1074 return bufStr.find( keyword ) != wxString::npos;
1075}
d5bb85a0 1076
8ec2b484 1077#endif