]> git.saurik.com Git - wxWidgets.git/blame - src/html/htmlfilt.cpp
avoid buffer overrun
[wxWidgets.git] / src / html / htmlfilt.cpp
CommitLineData
5526e819 1/////////////////////////////////////////////////////////////////////////////
69941f05 2// Name: htmlfilt.cpp
5526e819
VS
3// Purpose: wxHtmlFilter - input filter for translating into HTML format
4// Author: Vaclav Slavik
69941f05 5// RCS-ID: $Id$
5526e819 6// Copyright: (c) 1999 Vaclav Slavik
65571936 7// Licence: wxWindows licence
5526e819
VS
8/////////////////////////////////////////////////////////////////////////////
9
10
14f355c2 11#if defined(__GNUG__) && !defined(NO_GCC_PRAGMA)
1aedb1dd 12#pragma implementation "htmlfilt.h"
5526e819
VS
13#endif
14
4dcaf11a 15#include "wx/wxprec.h"
5526e819 16
314260fb 17#include "wx/defs.h"
f6bcfd97 18#if wxUSE_HTML && wxUSE_STREAMS
5526e819 19
2b5f62a0 20#ifdef __BORLANDC__
5526e819
VS
21#pragma hdrstop
22#endif
23
24#ifndef WXPRECOMP
04dbb646
VZ
25 #include "wx/log.h"
26 #include "wx/intl.h"
5526e819
VS
27#endif
28
2b5f62a0 29#include "wx/strconv.h"
69941f05 30#include "wx/html/htmlfilt.h"
4dcaf11a 31#include "wx/html/htmlwin.h"
5526e819 32
eb37e1d2 33// utility function: read a wxString from a wxInputStream
2b5f62a0 34static void ReadString(wxString& str, wxInputStream* s, wxMBConv& conv)
eb37e1d2
MB
35{
36 size_t streamSize = s->GetSize();
37
2b5f62a0 38 if (streamSize == ~(size_t)0)
eb37e1d2
MB
39 {
40 const size_t bufSize = 4095;
41 char buffer[bufSize+1];
42 size_t lastRead;
43
44 do
45 {
46 s->Read(buffer, bufSize);
47 lastRead = s->LastRead();
48 buffer[lastRead] = 0;
2b5f62a0 49 str.Append(wxString(buffer, conv));
eb37e1d2 50 }
2b5f62a0 51 while (lastRead == bufSize);
eb37e1d2
MB
52 }
53 else
54 {
55 char* src = new char[streamSize+1];
56 s->Read(src, streamSize);
57 src[streamSize] = 0;
2b5f62a0
VZ
58 str = wxString(src, conv);
59 delete[] src;
eb37e1d2
MB
60 }
61}
5526e819
VS
62
63/*
64
65There is code for several default filters:
66
67*/
68
69IMPLEMENT_ABSTRACT_CLASS(wxHtmlFilter, wxObject)
70
71//--------------------------------------------------------------------------------
72// wxHtmlFilterPlainText
73// filter for text/plain or uknown
74//--------------------------------------------------------------------------------
75
76IMPLEMENT_DYNAMIC_CLASS(wxHtmlFilterPlainText, wxHtmlFilter)
77
a4c97004 78bool wxHtmlFilterPlainText::CanRead(const wxFSFile& WXUNUSED(file)) const
5526e819 79{
d1da8872 80 return true;
5526e819
VS
81}
82
83
84
420ec58a 85wxString wxHtmlFilterPlainText::ReadFile(const wxFSFile& file) const
5526e819
VS
86{
87 wxInputStream *s = file.GetStream();
5526e819
VS
88 wxString doc, doc2;
89
90 if (s == NULL) return wxEmptyString;
2b5f62a0 91 ReadString(doc, s, wxConvISO8859_1);
5526e819 92
d1da8872
WS
93 doc.Replace(wxT("&"), wxT("&"), true);
94 doc.Replace(wxT("<"), wxT("&lt;"), true);
95 doc.Replace(wxT(">"), wxT("&gt;"), true);
2b5f62a0 96 doc2 = wxT("<HTML><BODY><PRE>\n") + doc + wxT("\n</PRE></BODY></HTML>");
5526e819
VS
97 return doc2;
98}
99
100
101
102
103
104//--------------------------------------------------------------------------------
105// wxHtmlFilterImage
106// filter for image/*
107//--------------------------------------------------------------------------------
108
109class wxHtmlFilterImage : public wxHtmlFilter
110{
111 DECLARE_DYNAMIC_CLASS(wxHtmlFilterImage)
112
113 public:
420ec58a
VS
114 virtual bool CanRead(const wxFSFile& file) const;
115 virtual wxString ReadFile(const wxFSFile& file) const;
5526e819
VS
116};
117
118IMPLEMENT_DYNAMIC_CLASS(wxHtmlFilterImage, wxHtmlFilter)
119
120
121
420ec58a 122bool wxHtmlFilterImage::CanRead(const wxFSFile& file) const
5526e819 123{
0413cec5 124 return (file.GetMimeType().Left(6) == wxT("image/"));
5526e819
VS
125}
126
127
128
420ec58a 129wxString wxHtmlFilterImage::ReadFile(const wxFSFile& file) const
5526e819 130{
2b5f62a0
VZ
131 wxString res = wxT("<HTML><BODY><IMG SRC=\"") + file.GetLocation() + wxT("\"></BODY></HTML>");
132 return res;
5526e819
VS
133}
134
135
136
137
138//--------------------------------------------------------------------------------
2b5f62a0
VZ
139// wxHtmlFilterHTML
140// filter for text/html
5526e819
VS
141//--------------------------------------------------------------------------------
142
5526e819
VS
143
144IMPLEMENT_DYNAMIC_CLASS(wxHtmlFilterHTML, wxHtmlFilter)
145
420ec58a 146bool wxHtmlFilterHTML::CanRead(const wxFSFile& file) const
5526e819 147{
f61815af
GL
148// return (file.GetMimeType() == "text/html");
149// This is true in most case but some page can return:
150// "text/html; char-encoding=...."
151// So we use Find instead
77611ad4 152 return (file.GetMimeType().Find(wxT("text/html")) == 0);
5526e819
VS
153}
154
155
156
420ec58a 157wxString wxHtmlFilterHTML::ReadFile(const wxFSFile& file) const
5526e819
VS
158{
159 wxInputStream *s = file.GetStream();
5526e819
VS
160 wxString doc;
161
04dbb646 162 if (s == NULL)
f3c82859 163 {
f6bcfd97 164 wxLogError(_("Cannot open HTML document: %s"), file.GetLocation().c_str());
f3c82859
VS
165 return wxEmptyString;
166 }
5526e819 167
d1da8872 168 // NB: We convert input file to wchar_t here in Unicode mode, based on
2b5f62a0
VZ
169 // either Content-Type header or <meta> tags. In ANSI mode, we don't
170 // do it as it is done by wxHtmlParser (for this reason, we add <meta>
171 // tag if we used Content-Type header).
172#if wxUSE_UNICODE
d1da8872 173 int charsetPos;
2b5f62a0
VZ
174 if ((charsetPos = file.GetMimeType().Find(_T("; charset="))) != wxNOT_FOUND)
175 {
176 wxString charset = file.GetMimeType().Mid(charsetPos + 10);
177 wxCSConv conv(charset);
178 ReadString(doc, s, conv);
179 }
180 else
181 {
182 wxString tmpdoc;
183 ReadString(tmpdoc, s, wxConvISO8859_1);
184 wxString charset = wxHtmlParser::ExtractCharsetInformation(tmpdoc);
185 if (charset.empty())
186 doc = tmpdoc;
187 else
188 {
189 wxCSConv conv(charset);
190 doc = wxString(tmpdoc.mb_str(wxConvISO8859_1), conv);
191 }
192 }
193#else // !wxUSE_UNICODE
194 ReadString(doc, s, wxConvLibc);
04dbb646 195 // add meta tag if we obtained this through http:
2b5f62a0 196 if (!file.GetMimeType().empty())
981e62aa 197 {
2b5f62a0
VZ
198 wxString hdr;
199 wxString mime = file.GetMimeType();
200 hdr.Printf(_T("<meta http-equiv=\"Content-Type\" content=\"%s\">"), mime.c_str());
201 return hdr+doc;
981e62aa 202 }
2b5f62a0 203#endif
981e62aa 204
3ca6a5f0 205 return doc;
5526e819
VS
206}
207
208
209
210
211///// Module:
212
213class wxHtmlFilterModule : public wxModule
214{
215 DECLARE_DYNAMIC_CLASS(wxHtmlFilterModule)
216
217 public:
218 virtual bool OnInit()
219 {
220 wxHtmlWindow::AddFilter(new wxHtmlFilterHTML);
221 wxHtmlWindow::AddFilter(new wxHtmlFilterImage);
d1da8872 222 return true;
5526e819
VS
223 }
224 virtual void OnExit() {}
225};
226
227IMPLEMENT_DYNAMIC_CLASS(wxHtmlFilterModule, wxModule)
228
8dd71e2b 229#endif