]> git.saurik.com Git - wxWidgets.git/blob - src/html/htmlpars.cpp
fixed incorrect parsing of http://domain.com:portnumber/
[wxWidgets.git] / src / html / htmlpars.cpp
1 /////////////////////////////////////////////////////////////////////////////
2 // Name: htmlpars.cpp
3 // Purpose: wxHtmlParser class (generic parser)
4 // Author: Vaclav Slavik
5 // RCS-ID: $Id$
6 // Copyright: (c) 1999 Vaclav Slavik
7 // Licence: wxWindows Licence
8 /////////////////////////////////////////////////////////////////////////////
9
10
11 #ifdef __GNUG__
12 #pragma implementation
13 #endif
14
15 #include "wx/wxprec.h"
16
17 #include "wx/defs.h"
18 #if wxUSE_HTML
19
20 #ifdef __BORDLANDC__
21 #pragma hdrstop
22 #endif
23
24 #ifndef WXPRECOMP
25 #include "wx/wx.h"
26 #endif
27
28 #include "wx/tokenzr.h"
29 #include "wx/wfstream.h"
30 #include "wx/url.h"
31 #include "wx/html/htmldefs.h"
32 #include "wx/html/htmlpars.h"
33
34
35
36 //-----------------------------------------------------------------------------
37 // wxHtmlParser
38 //-----------------------------------------------------------------------------
39
40 IMPLEMENT_ABSTRACT_CLASS(wxHtmlParser,wxObject)
41
42
43 wxObject* wxHtmlParser::Parse(const wxString& source)
44 {
45 wxObject *result;
46
47 InitParser(source);
48 DoParsing();
49 result = GetProduct();
50 DoneParser();
51 return result;
52 }
53
54
55
56 void wxHtmlParser::InitParser(const wxString& source)
57 {
58 m_Source = source;
59 m_Cache = new wxHtmlTagsCache(m_Source);
60 }
61
62
63
64 void wxHtmlParser::DoneParser()
65 {
66 delete m_Cache;
67 m_Cache = NULL;
68 }
69
70
71
72 #define wxHTML_MAX_BUFLEN 1024
73
74 void wxHtmlParser::DoParsing(int begin_pos, int end_pos)
75 {
76 char temp[wxHTML_BUFLEN], c;
77 int i;
78 int templen;
79
80 templen = 0;
81 i = begin_pos;
82
83 while (i < end_pos) {
84 c = m_Source[(unsigned int) i];
85
86 // continue building word:
87 if (c != '<') {
88 temp[templen++] = c;
89 if (templen == wxHTML_BUFLEN-1) {
90 temp[templen] = 0;
91 AddText(temp);
92 templen = 0;
93 }
94 i++;
95 }
96
97 else if (c == '<') {
98 wxHtmlTag tag(m_Source, i, end_pos, m_Cache);
99
100 if (templen) {
101 temp[templen] = 0;
102 AddText(temp);
103 templen = 0;
104 }
105 AddTag(tag);
106 if (tag.HasEnding()) i = tag.GetEndPos2();
107 else i = tag.GetBeginPos();
108 }
109 }
110
111 if (templen) { // last word of block :-(
112 temp[templen] = 0;
113 AddText(temp);
114 }
115 }
116
117
118
119 void wxHtmlParser::AddTag(const wxHtmlTag& tag)
120 {
121 wxHtmlTagHandler *h;
122 bool inner = FALSE;
123
124 h = (wxHtmlTagHandler*) m_HandlersHash.Get(tag.GetName());
125 if (h)
126 inner = h -> HandleTag(tag);
127 if (!inner) {
128 if (tag.HasEnding())
129 DoParsing(tag.GetBeginPos(), tag.GetEndPos1());
130 }
131 }
132
133
134
135 void wxHtmlParser::AddTagHandler(wxHtmlTagHandler *handler)
136 {
137 wxString s(handler -> GetSupportedTags());
138 wxStringTokenizer tokenizer(s, ", ");
139
140 while (tokenizer.HasMoreTokens())
141 m_HandlersHash.Put(tokenizer.NextToken(), handler);
142
143 if (m_HandlersList.IndexOf(handler) == wxNOT_FOUND)
144 m_HandlersList.Append(handler);
145
146 handler -> SetParser(this);
147 }
148
149
150
151 void wxHtmlParser::PushTagHandler(wxHtmlTagHandler *handler, wxString tags)
152 {
153 wxStringTokenizer tokenizer(tags, ", ");
154 wxString key;
155
156 if (m_HandlersStack == NULL) {
157 m_HandlersStack = new wxList;
158 m_HandlersStack -> DeleteContents(TRUE);
159 }
160
161 m_HandlersStack -> Insert(new wxHashTable(m_HandlersHash));
162
163 while (tokenizer.HasMoreTokens()) {
164 key = tokenizer.NextToken();
165 m_HandlersHash.Delete(key);
166 m_HandlersHash.Put(key, handler);
167 }
168 }
169
170
171
172 void wxHtmlParser::PopTagHandler()
173 {
174 wxNode *first;
175
176 if (m_HandlersStack == NULL ||
177 (first = m_HandlersStack -> GetFirst()) == NULL)
178 {
179 wxLogWarning(_("Warning: attempt to remove HTML tag handler from empty stack."));
180 return;
181 }
182 m_HandlersHash = *((wxHashTable*) first -> GetData());
183 m_HandlersStack -> DeleteNode(first);
184 }
185
186
187
188 wxHtmlParser::~wxHtmlParser()
189 {
190 if (m_HandlersStack) delete m_HandlersStack;
191 m_HandlersHash.Clear();
192 m_HandlersList.DeleteContents(TRUE);
193 m_HandlersList.Clear();
194 }
195
196
197
198 //-----------------------------------------------------------------------------
199 // wxHtmlTagHandler
200 //-----------------------------------------------------------------------------
201
202 IMPLEMENT_ABSTRACT_CLASS(wxHtmlTagHandler,wxObject)
203 #endif
204