]>
git.saurik.com Git - wxWidgets.git/blob - src/html/chm.cpp
1 /////////////////////////////////////////////////////////////////////////////
2 // Name: src/html/chm.cpp
3 // Purpose: CHM (Help) support for wxHTML
4 // Author: Markus Sinner
5 // Copyright: (c) 2003 Herd Software Development
7 // Licence: wxWindows licence
8 /////////////////////////////////////////////////////////////////////////////
10 #include "wx/wxprec.h"
23 #include "wx/module.h"
26 #include "wx/filesys.h"
27 #include "wx/mstream.h"
28 #include "wx/wfstream.h"
30 #include "wx/html/forcelnk.h"
31 FORCE_LINK_ME(wxhtml_chm_support
)
33 // ----------------------------------------------------------------------------
36 /// this class is used to abstract access to CHM-Archives
37 /// with library mspack written by Stuart Caie
38 /// http://www.kyz.uklinux.net/libmspack/
39 // ----------------------------------------------------------------------------
44 wxChmTools(const wxFileName
&archive
);
48 /// Generate error-string for error-code
49 static const wxString
ChmErrorMsg(int error
);
51 /// get an array of archive-member-filenames
52 const wxArrayString
*GetFileNames()
57 /// get the name of the archive representated by this class
58 const wxString
GetArchiveName()
63 /// Find a file in the archive
64 const wxString
Find(const wxString
& pattern
,
65 const wxString
& startfrom
= wxEmptyString
);
67 /// Extract a file in the archive into a file
68 size_t Extract(const wxString
& pattern
, const wxString
& filename
);
70 /// check archive for a file
71 bool Contains(const wxString
& pattern
);
73 /// get a string for the last error which occurred
74 const wxString
GetLastErrorMessage();
80 // these vars are used by FindFirst/Next:
81 wxString m_chmFileName
;
82 char *m_chmFileNameANSI
;
84 /// mspack-pointer to mschmd_header
85 struct mschmd_header
*m_archive
;
86 /// mspack-pointer to mschm_decompressor
87 struct mschm_decompressor
*m_decompressor
;
89 /// Array of filenames in archive
90 wxArrayString
* m_fileNames
;
92 /// Internal function to get filepointer
93 struct mschmd_file
*GetMschmdFile(const wxString
& pattern
);
100 * @param archive The filename of the archive to open
102 wxChmTools::wxChmTools(const wxFileName
&archive
)
104 m_chmFileName
= archive
.GetFullPath();
106 wxASSERT_MSG( !m_chmFileName
.empty(), _T("empty archive name") );
109 m_decompressor
= NULL
;
113 struct mschmd_header
*chmh
;
114 struct mschm_decompressor
*chmd
;
115 struct mschmd_file
*file
;
117 // Create decompressor
118 chmd
= mspack_create_chm_decompressor(NULL
);
119 m_decompressor
= (struct mschm_decompressor
*) chmd
;
121 // NB: we must make a copy of the string because chmd->open won't call
122 // strdup() [libmspack-20030726], which would cause crashes in
123 // Unicode build when mb_str() returns temporary buffer
124 m_chmFileNameANSI
= strdup((const char*)m_chmFileName
.mb_str(wxConvFile
));
126 // Open the archive and store it in class:
127 if ( (chmh
= chmd
->open(chmd
, (char*)m_chmFileNameANSI
)) )
131 // Create Filenamearray
132 m_fileNames
= new wxArrayString
;
134 // Store Filenames in array
135 for (file
= chmh
->files
; file
; file
= file
->next
)
137 m_fileNames
->Add(wxString::FromAscii(file
->filename
));
142 wxLogError(_("Failed to open CHM archive '%s'."),
143 archive
.GetFullPath().c_str());
144 m_lasterror
= (chmd
->last_error(chmd
));
153 wxChmTools::~wxChmTools()
155 struct mschm_decompressor
*chmd
= m_decompressor
;
156 struct mschmd_header
*chmh
= m_archive
;
162 chmd
->close(chmd
, chmh
);
164 free(m_chmFileNameANSI
);
166 // Destroy Decompressor
168 mspack_destroy_chm_decompressor(chmd
);
174 * Checks if the given pattern matches to any
175 * filename stored in archive
177 * @param pattern The filename pattern, may include '*' and/or '?'
178 * @return true, if any file matching pattern has been found,
181 bool wxChmTools::Contains(const wxString
& pattern
)
184 wxString pattern_tmp
= wxString(pattern
).MakeLower();
186 // loop through filearay
187 if ( m_fileNames
&& (count
= m_fileNames
->GetCount()) > 0 )
189 for (int i
= 0; i
< count
; i
++)
191 wxString tmp
= m_fileNames
->Item(i
).MakeLower();
192 if ( tmp
.Matches(pattern_tmp
) || tmp
.Mid(1).Matches(pattern_tmp
))
205 * Finds the next file descibed by a pattern in the archive, starting
206 * the file given by second parameter
208 * @param pattern The file-pattern to search for. May contain '*' and/or '?'
209 * @param startfrom The filename which the search should start after
210 * @returns The full pathname of the found file
212 const wxString
wxChmTools::Find(const wxString
& pattern
,
213 const wxString
& startfrom
)
217 wxString
pattern_tmp(pattern
);
218 wxString
startfrom_tmp(startfrom
);
219 pattern_tmp
.MakeLower();
220 startfrom_tmp
.MakeLower();
222 if ( m_fileNames
&& (count
= m_fileNames
->GetCount()) > 0 )
224 for (int i
= 0; i
< count
; i
++)
226 tmp
= m_fileNames
->Item(i
).MakeLower();
227 // if we find the string where the search should began
228 if ( tmp
.Matches(startfrom_tmp
) ||
229 tmp
.Mid(1).Matches(startfrom_tmp
) )
231 if ( tmp
.Matches(pattern_tmp
) ||
232 tmp
.Mid(1).Matches(pattern_tmp
) )
239 return wxEmptyString
;
246 * extracts the first hit of pattern to the given position
248 * @param pattern A filename pattern (may contain * and ? chars)
249 * @param filename The FileName where to temporary extract the file to
250 * @return 0 at no file extracted<br>
251 * number of bytes extracted else
253 size_t wxChmTools::Extract(const wxString
& pattern
, const wxString
& filename
)
255 struct mschm_decompressor
*d
= m_decompressor
;
256 struct mschmd_header
*h
= m_archive
;
257 struct mschmd_file
*f
;
260 wxString pattern_tmp
= (wxString(pattern
)).MakeLower();
262 for (f
= h
->files
; f
; f
= f
->next
)
264 tmp
= wxString::FromAscii(f
->filename
).MakeLower();
265 if ( tmp
.Matches(pattern_tmp
) ||
266 tmp
.Mid(1).Matches(pattern_tmp
) )
268 // ignore leading '/'
270 (char*)(const char*)filename
.mb_str(wxConvFile
)))
273 m_lasterror
= d
->last_error(d
);
274 wxLogError(_("Could not extract %s into %s: %s"),
275 wxString::FromAscii(f
->filename
).c_str(),
277 ChmErrorMsg(m_lasterror
).c_str());
282 return (size_t) f
->length
;
293 * Find a file by pattern
295 * @param pattern A filename pattern (may contain * and ? chars)
296 * @return A pointer to the file (mschmd_file*)
298 struct mschmd_file
*wxChmTools::GetMschmdFile(const wxString
& pattern_orig
)
300 struct mschmd_file
*f
;
301 struct mschmd_header
*h
= (struct mschmd_header
*) m_archive
;
303 wxString pattern
= wxString(pattern_orig
).MakeLower();
305 for (f
= h
->files
; f
; f
= f
->next
)
307 tmp
= wxString::FromAscii(f
->filename
).MakeLower();
308 if ( tmp
.Matches(pattern
) || tmp
.Mid(1).Matches(pattern
) )
310 // ignore leading '/'
318 const wxString
wxChmTools::GetLastErrorMessage()
320 return ChmErrorMsg(m_lasterror
);
323 const wxString
wxChmTools::ChmErrorMsg(int error
)
328 return _("no error");
329 case MSPACK_ERR_ARGS
:
330 return _("bad arguments to library function");
331 case MSPACK_ERR_OPEN
:
332 return _("error opening file");
333 case MSPACK_ERR_READ
:
334 return _("read error");
335 case MSPACK_ERR_WRITE
:
336 return _("write error");
337 case MSPACK_ERR_SEEK
:
338 return _("seek error");
339 case MSPACK_ERR_NOMEMORY
:
340 return _("out of memory");
341 case MSPACK_ERR_SIGNATURE
:
342 return _("bad signature");
343 case MSPACK_ERR_DATAFORMAT
:
344 return _("error in data format");
345 case MSPACK_ERR_CHECKSUM
:
346 return _("checksum error");
347 case MSPACK_ERR_CRUNCH
:
348 return _("compression error");
349 case MSPACK_ERR_DECRUNCH
:
350 return _("decompression error");
352 return _("unknown error");
356 // ---------------------------------------------------------------------------
358 // ---------------------------------------------------------------------------
360 class wxChmInputStream
: public wxInputStream
364 wxChmInputStream(const wxString
& archive
,
365 const wxString
& file
, bool simulate
= false);
369 /// Return the size of the accessed file in archive
370 virtual size_t GetSize() const { return m_size
; }
372 virtual bool Eof() const;
373 /// Set simulation-mode of HHP-File (if non is found)
374 void SimulateHHP(bool sim
) { m_simulateHHP
= sim
; }
377 /// See wxInputStream
378 virtual size_t OnSysRead(void *buffer
, size_t bufsize
);
379 /// See wxInputStream
380 virtual wxFileOffset
OnSysSeek(wxFileOffset seek
, wxSeekMode mode
);
381 /// See wxInputStream
382 virtual wxFileOffset
OnSysTell() const { return m_pos
; }
390 wxInputStream
* m_contentStream
;
392 void CreateHHPStream();
393 bool CreateFileStream(const wxString
& pattern
);
394 // this void* is handle of archive . I'm sorry it is void and not proper
395 // type but I don't want to make unzip.h header public.
398 // locates the file and returns a mspack_file *
399 mspack_file
*LocateFile(wxString filename
);
401 // should store pointer to current file
404 // The Chm-Class for extracting the data
413 * @param archive The name of the .chm archive. Remember that archive must
414 * be local file accesible via fopen, fread functions!
415 * @param filename The Name of the file to be extracted from archive
416 * @param simulate if true than class should simulate .HHP-File based on #SYSTEM
417 * if false than class does nothing if it doesnt find .hhp
419 wxChmInputStream::wxChmInputStream(const wxString
& archive
,
420 const wxString
& filename
, bool simulate
)
426 m_contentStream
= NULL
;
427 m_lasterror
= wxSTREAM_NO_ERROR
;
428 m_chm
= new wxChmTools (wxFileName(archive
));
430 m_fileName
= wxString(filename
).MakeLower();
431 m_simulateHHP
= simulate
;
433 if ( !m_chm
->Contains(m_fileName
) )
435 // if the file could not be located, but was *.hhp, than we create
436 // the content of the hhp-file on the fly and store it for reading
437 // by the application
438 if ( m_fileName
.Find(_T(".hhp")) != wxNOT_FOUND
&& m_simulateHHP
)
440 // now we open an hhp-file
445 wxLogError(_("Could not locate file '%s'."), filename
.c_str());
446 m_lasterror
= wxSTREAM_READ_ERROR
;
452 CreateFileStream(m_fileName
);
457 wxChmInputStream::~wxChmInputStream()
461 delete m_contentStream
;
470 bool wxChmInputStream::Eof() const
472 return (m_content
==NULL
||
473 m_contentStream
==NULL
||
474 m_contentStream
->Eof() ||
480 size_t wxChmInputStream::OnSysRead(void *buffer
, size_t bufsize
)
482 if ( m_pos
>= m_size
)
484 m_lasterror
= wxSTREAM_EOF
;
487 m_lasterror
= wxSTREAM_NO_ERROR
;
489 // If the rest to read from the stream is less
490 // than the buffer size, than only read the rest
491 if ( m_pos
+ bufsize
> m_size
)
492 bufsize
= m_size
- m_pos
;
494 m_contentStream
->SeekI(m_pos
);
495 m_contentStream
->Read(buffer
, bufsize
);
497 m_contentStream
->SeekI(m_pos
);
504 wxFileOffset
wxChmInputStream::OnSysSeek(wxFileOffset seek
, wxSeekMode mode
)
506 wxString mode_str
= wxEmptyString
;
508 if ( !m_contentStream
|| m_contentStream
->Eof() )
510 m_lasterror
= wxSTREAM_EOF
;
513 m_lasterror
= wxSTREAM_NO_ERROR
;
515 wxFileOffset nextpos
;
520 nextpos
= seek
+ m_pos
;
526 nextpos
= m_size
- 1 + seek
;
530 break; /* just to fool compiler, never happens */
534 // Set current position on stream
535 m_contentStream
->SeekI(m_pos
);
542 * Help Browser tries to read the contents of the
543 * file by interpreting a .hhp file in the Archiv.
544 * For .chm doesnt include such a file, we need
545 * to rebuild the information based on stored
549 wxChmInputStream::CreateHHPStream()
556 wxMemoryOutputStream
*out
;
559 // Try to open the #SYSTEM-File and create the HHP File out of it
560 // see http://bonedaddy.net/pabs3/chmspec/0.1.2/Internal.html#SYSTEM
561 if ( ! m_chm
->Contains(_T("/#SYSTEM")) )
564 wxLogDebug(_("Archive doesnt contain #SYSTEM file"));
570 file
= wxFileName(_T("/#SYSTEM"));
573 if ( CreateFileStream(_T("/#SYSTEM")) )
575 // New stream for writing a memory area to simulate the
577 out
= new wxMemoryOutputStream();
579 tmp
= "[OPTIONS]\r\n";
580 out
->Write((const void *) tmp
, strlen(tmp
));
586 // use the actual stream for reading
589 /* Now read the contents, and try to get the needed information */
591 // First 4 Bytes are Version information, skip
596 // Read #SYSTEM-Code and length
598 code
= wxUINT16_SWAP_ON_BE( code
) ;
600 len
= wxUINT16_SWAP_ON_BE( len
) ;
607 case 0: // CONTENTS_FILE
608 tmp
= "Contents file=";
611 case 1: // INDEX_FILE
615 case 2: // DEFAULT_TOPIC
616 tmp
= "Default Topic=";
622 // case 6: // COMPILED_FILE
623 // tmp = "Compiled File=";
625 case 7: // COMPILED_FILE
626 tmp
= "Binary Index=YES\r\n";
627 out
->Write( (const void *) tmp
, strlen(tmp
));
630 case 4: // STRUCT SYSTEM INFO
634 char *structptr
= (char*) buf
;
635 // LCID at position 0
636 wxUint32 dummy
= *((wxUint32
*)(structptr
+0)) ;
637 wxUint32 lcid
= wxUINT32_SWAP_ON_BE( dummy
) ;
639 msg
.Printf(_T("Language=0x%X\r\n"),lcid
) ;
640 out
->Write(msg
.c_str() , msg
.length() ) ;
649 out
->Write((const void *) tmp
, strlen(tmp
));
650 out
->Write(buf
, strlen((char*)buf
));
651 out
->Write("\r\n", 2);
659 // Free the old data which wont be used any more
660 delete m_contentStream
;
664 // Now add entries which are missing
665 if ( !hhc
&& m_chm
->Contains(_T("*.hhc")) )
667 tmp
= "Contents File=*.hhc\r\n";
668 out
->Write((const void *) tmp
, strlen(tmp
));
671 if ( !hhk
&& m_chm
->Contains(_T("*.hhk")) )
673 tmp
= "Index File=*.hhk\r\n";
674 out
->Write((const void *) tmp
, strlen(tmp
));
677 // Now copy the Data from the memory
678 out
->SeekO(0, wxFromEnd
);
679 m_size
= out
->TellO();
680 out
->SeekO(0, wxFromStart
);
681 m_content
= (char *) malloc (m_size
+1);
682 out
->CopyTo(m_content
, m_size
);
683 m_content
[m_size
]='\0';
685 m_contentStream
= new wxMemoryInputStream(m_content
, m_size
);
693 * Creates a Stream pointing to a virtual file in
694 * the current archive
696 bool wxChmInputStream::CreateFileStream(const wxString
& pattern
)
698 wxFileInputStream
* fin
;
699 wxString tmpfile
= wxFileName::CreateTempFileName(_T("chmstrm"), NULL
);
701 if ( tmpfile
.empty() )
703 wxLogError(_("Could not create temporary file '%s'"), tmpfile
.c_str());
707 // try to extract the file
708 if ( m_chm
->Extract(pattern
, tmpfile
) <= 0 )
710 wxLogError(_("Extraction of '%s' into '%s' failed."),
711 pattern
.c_str(), tmpfile
.c_str());
712 if ( wxFileExists(tmpfile
) )
713 wxRemoveFile(tmpfile
);
718 // Open a filestream to extracted file
719 fin
= new wxFileInputStream(tmpfile
);
720 m_size
= fin
->GetSize();
721 m_content
= (char *) malloc(m_size
+1);
722 fin
->Read(m_content
, m_size
);
723 m_content
[m_size
]='\0';
725 wxRemoveFile(tmpfile
);
729 m_contentStream
= new wxMemoryInputStream (m_content
, m_size
);
731 return m_contentStream
->IsOk();
737 // ----------------------------------------------------------------------------
739 // ----------------------------------------------------------------------------
741 class wxChmFSHandler
: public wxFileSystemHandler
744 /// Constructor and Destructor
748 /// Is able to open location?
749 virtual bool CanOpen(const wxString
& location
);
751 virtual wxFSFile
* OpenFile(wxFileSystem
& fs
, const wxString
& location
);
752 /// Find first occurrence of spec
753 virtual wxString
FindFirst(const wxString
& spec
, int flags
= 0);
754 /// Find next occurrence of spec
755 virtual wxString
FindNext();
764 wxChmFSHandler::wxChmFSHandler() : wxFileSystemHandler()
767 m_pattern
=wxEmptyString
;
768 m_found
=wxEmptyString
;
772 wxChmFSHandler::~wxChmFSHandler()
778 bool wxChmFSHandler::CanOpen(const wxString
& location
)
780 wxString p
= GetProtocol(location
);
781 return (p
== _T("chm")) &&
782 (GetProtocol(GetLeftLocation(location
)) == _T("file"));
785 wxFSFile
* wxChmFSHandler::OpenFile(wxFileSystem
& WXUNUSED(fs
),
786 const wxString
& location
)
788 wxString right
= GetRightLocation(location
);
789 wxString left
= GetLeftLocation(location
);
795 if ( GetProtocol(left
) != _T("file") )
797 wxLogError(_("CHM handler currently supports only local files!"));
801 // Work around javascript
802 wxString tmp
= wxString(right
);
803 if ( tmp
.MakeLower().Contains(_T("javascipt")) && tmp
.Contains(_T("\'")) )
805 right
= right
.AfterFirst(_T('\'')).BeforeLast(_T('\''));
808 // now work on the right location
809 if (right
.Contains(_T("..")))
811 wxFileName
abs(right
);
812 abs
.MakeAbsolute(_T("/"));
813 right
= abs
.GetFullPath();
816 // a workaround for absolute links to root
817 if ( (index
=right
.Index(_T("//"))) != wxNOT_FOUND
)
819 right
=wxString(right
.Mid(index
+1));
820 wxLogWarning(_("Link contained '//', converted to absolute link."));
823 wxFileName leftFilename
= wxFileSystem::URLToFileName(left
);
825 // Open a stream to read the content of the chm-file
826 s
= new wxChmInputStream(leftFilename
.GetFullPath(), right
, true);
828 wxString mime
= GetMimeTypeFromExt(location
);
832 return new wxFSFile(s
,
833 left
+ _T("#chm:") + right
,
836 wxDateTime(wxFileModificationTime(left
)));
846 * Doku see wxFileSystemHandler
848 wxString
wxChmFSHandler::FindFirst(const wxString
& spec
, int flags
)
850 wxString right
= GetRightLocation(spec
);
851 wxString left
= GetLeftLocation(spec
);
852 wxString nativename
= wxFileSystem::URLToFileName(left
).GetFullPath();
854 if ( GetProtocol(left
) != _T("file") )
856 wxLogError(_("CHM handler currently supports only local files!"));
857 return wxEmptyString
;
860 m_chm
= new wxChmTools(wxFileName(nativename
));
861 m_pattern
= right
.AfterLast(_T('/'));
863 wxString m_found
= m_chm
->Find(m_pattern
);
865 // now fake around hhp-files which are not existing in projects...
866 if (m_found
.empty() &&
867 m_pattern
.Contains(_T(".hhp")) &&
868 !m_pattern
.Contains(_T(".hhp.cached")))
870 m_found
.Printf(_T("%s#chm:%s.hhp"),
871 left
.c_str(), m_pattern
.BeforeLast(_T('.')).c_str());
880 wxString
wxChmFSHandler::FindNext()
882 if (m_pattern
.empty())
883 return wxEmptyString
;
885 return m_chm
->Find(m_pattern
, m_found
);
888 // ---------------------------------------------------------------------------
889 // wxModule to register CHM handler
890 // ---------------------------------------------------------------------------
892 class wxChmSupportModule
: public wxModule
894 DECLARE_DYNAMIC_CLASS(wxChmSupportModule
)
897 virtual bool OnInit()
899 wxFileSystem::AddHandler(new wxChmFSHandler
);
902 virtual void OnExit() {}
906 IMPLEMENT_DYNAMIC_CLASS(wxChmSupportModule
, wxModule
)
908 #endif // wxUSE_LIBMSPACK