]>
Commit | Line | Data |
---|---|---|
5526e819 | 1 | ///////////////////////////////////////////////////////////////////////////// |
69941f05 | 2 | // Name: htmlpars.cpp |
5526e819 VS |
3 | // Purpose: wxHtmlParser class (generic parser) |
4 | // Author: Vaclav Slavik | |
69941f05 | 5 | // RCS-ID: $Id$ |
5526e819 VS |
6 | // Copyright: (c) 1999 Vaclav Slavik |
7 | // Licence: wxWindows Licence | |
8 | ///////////////////////////////////////////////////////////////////////////// | |
9 | ||
10 | ||
11 | #ifdef __GNUG__ | |
12 | #pragma implementation | |
13 | #endif | |
14 | ||
3096bd2f | 15 | #include "wx/wxprec.h" |
5526e819 VS |
16 | |
17 | #include "wx/defs.h" | |
18 | #if wxUSE_HTML | |
19 | ||
// Borland compilers predefine __BORLANDC__ (the previous spelling,
// __BORDLANDC__, is never defined, so the pragma was silently skipped).
#ifdef __BORLANDC__
#pragma hdrstop
#endif
23 | ||
24 | #ifndef WXPRECOMP | |
3096bd2f | 25 | #include "wx/wx.h" |
5526e819 VS |
26 | #endif |
27 | ||
69941f05 VS |
28 | #include "wx/tokenzr.h" |
29 | #include "wx/wfstream.h" | |
30 | #include "wx/url.h" | |
31 | #include "wx/html/htmldefs.h" | |
32 | #include "wx/html/htmlpars.h" | |
5526e819 VS |
33 | |
34 | ||
35 | ||
36 | //----------------------------------------------------------------------------- | |
37 | // wxHtmlParser | |
38 | //----------------------------------------------------------------------------- | |
39 | ||
40 | IMPLEMENT_ABSTRACT_CLASS(wxHtmlParser,wxObject) | |
41 | ||
42 | ||
43 | wxObject* wxHtmlParser::Parse(const wxString& source) | |
44 | { | |
45 | wxObject *result; | |
46 | ||
47 | InitParser(source); | |
48 | DoParsing(); | |
49 | result = GetProduct(); | |
50 | DoneParser(); | |
51 | return result; | |
52 | } | |
53 | ||
54 | ||
55 | ||
56 | void wxHtmlParser::InitParser(const wxString& source) | |
57 | { | |
58 | m_Source = source; | |
59 | m_Cache = new wxHtmlTagsCache(m_Source); | |
60 | } | |
61 | ||
62 | ||
63 | ||
64 | void wxHtmlParser::DoneParser() | |
65 | { | |
66 | delete m_Cache; | |
67 | m_Cache = NULL; | |
68 | } | |
69 | ||
70 | ||
71 | ||
efba2b89 | 72 | #define wxHTML_MAX_BUFLEN 1024 |
5526e819 VS |
73 | |
74 | void wxHtmlParser::DoParsing(int begin_pos, int end_pos) | |
75 | { | |
efba2b89 | 76 | char temp[wxHTML_BUFLEN], c; |
5526e819 VS |
77 | int i; |
78 | int templen; | |
79 | ||
80 | templen = 0; | |
81 | i = begin_pos; | |
82 | ||
83 | while (i < end_pos) { | |
01dba85a | 84 | c = m_Source[(unsigned int) i]; |
5526e819 VS |
85 | |
86 | // continue building word: | |
87 | if (c != '<') { | |
88 | temp[templen++] = c; | |
efba2b89 | 89 | if (templen == wxHTML_BUFLEN-1) { |
5526e819 VS |
90 | temp[templen] = 0; |
91 | AddText(temp); | |
92 | templen = 0; | |
93 | } | |
94 | i++; | |
95 | } | |
96 | ||
97 | else if (c == '<') { | |
98 | wxHtmlTag tag(m_Source, i, end_pos, m_Cache); | |
99 | ||
100 | if (templen) { | |
101 | temp[templen] = 0; | |
102 | AddText(temp); | |
103 | templen = 0; | |
104 | } | |
105 | AddTag(tag); | |
106 | if (tag.HasEnding()) i = tag.GetEndPos2(); | |
107 | else i = tag.GetBeginPos(); | |
108 | } | |
109 | } | |
110 | ||
111 | if (templen) { // last word of block :-( | |
112 | temp[templen] = 0; | |
113 | AddText(temp); | |
114 | } | |
115 | } | |
116 | ||
117 | ||
118 | ||
119 | void wxHtmlParser::AddTag(const wxHtmlTag& tag) | |
120 | { | |
121 | wxHtmlTagHandler *h; | |
122 | bool inner = FALSE; | |
123 | ||
124 | h = (wxHtmlTagHandler*) m_HandlersHash.Get(tag.GetName()); | |
125 | if (h) | |
126 | inner = h -> HandleTag(tag); | |
127 | if (!inner) { | |
128 | if (tag.HasEnding()) | |
129 | DoParsing(tag.GetBeginPos(), tag.GetEndPos1()); | |
130 | } | |
131 | } | |
132 | ||
133 | ||
134 | ||
135 | void wxHtmlParser::AddTagHandler(wxHtmlTagHandler *handler) | |
136 | { | |
137 | wxString s(handler -> GetSupportedTags()); | |
138 | wxStringTokenizer tokenizer(s, ", "); | |
139 | ||
5526e819 | 140 | while (tokenizer.HasMoreTokens()) |
5526e819 VS |
141 | m_HandlersHash.Put(tokenizer.NextToken(), handler); |
142 | ||
143 | if (m_HandlersList.IndexOf(handler) == wxNOT_FOUND) | |
144 | m_HandlersList.Append(handler); | |
145 | ||
146 | handler -> SetParser(this); | |
147 | } | |
148 | ||
149 | ||
150 | ||
a7a4d01b VS |
151 | void wxHtmlParser::PushTagHandler(wxHtmlTagHandler *handler, wxString tags) |
152 | { | |
153 | wxStringTokenizer tokenizer(tags, ", "); | |
154 | wxString key; | |
155 | ||
156 | if (m_HandlersStack == NULL) { | |
157 | m_HandlersStack = new wxList; | |
158 | m_HandlersStack -> DeleteContents(TRUE); | |
159 | } | |
160 | ||
161 | m_HandlersStack -> Insert(new wxHashTable(m_HandlersHash)); | |
162 | ||
163 | while (tokenizer.HasMoreTokens()) { | |
164 | key = tokenizer.NextToken(); | |
165 | m_HandlersHash.Delete(key); | |
166 | m_HandlersHash.Put(key, handler); | |
167 | } | |
168 | } | |
169 | ||
170 | ||
171 | ||
172 | void wxHtmlParser::PopTagHandler() | |
173 | { | |
174 | wxNode *first; | |
175 | ||
176 | if (m_HandlersStack == NULL || (first = m_HandlersStack -> GetFirst()) == NULL) return; | |
177 | m_HandlersHash = *((wxHashTable*) first -> GetData()); | |
178 | m_HandlersStack -> DeleteNode(first); | |
179 | } | |
180 | ||
181 | ||
182 | ||
5526e819 VS |
183 | wxHtmlParser::~wxHtmlParser() |
184 | { | |
a7a4d01b | 185 | if (m_HandlersStack) delete m_HandlersStack; |
5526e819 VS |
186 | m_HandlersHash.Clear(); |
187 | m_HandlersList.DeleteContents(TRUE); | |
188 | m_HandlersList.Clear(); | |
189 | } | |
190 | ||
191 | ||
192 | ||
193 | //----------------------------------------------------------------------------- | |
194 | // wxHtmlTagHandler | |
195 | //----------------------------------------------------------------------------- | |
196 | ||
197 | IMPLEMENT_ABSTRACT_CLASS(wxHtmlTagHandler,wxObject) | |
223d09f6 | 198 | #endif |
5526e819 | 199 |