]> git.saurik.com Git - wxWidgets.git/blame - docs/latex/wx/htparser.tex
wxPython doc updates
[wxWidgets.git] / docs / latex / wx / htparser.tex
CommitLineData
704a4b75
VS
1%
2% automatically generated by HelpGen from
3% htmlparser.tex at 14/Mar/99 20:13:37
4%
5
704a4b75
VS
6\section{\class{wxHtmlParser}}\label{wxhtmlparser}
7
22d6efa8 8This class handles the {\bf generic} parsing of HTML document: it scans
704a4b75
VS
9the document and divide it into blocks of tags (where one block
10consists of begining and ending tag and of text between these
22d6efa8 11two tags).
704a4b75
VS
12
13It is independent from wxHtmlWindow and can be used as stand-alone parser
14(Julian Smart's idea of speech-only HTML viewer or wget-like utility -
3660fc40 15see InetGet sample for example).
704a4b75
VS
16
17It uses system of tag handlers to parse the HTML document. Tag handlers
3660fc40 18are not staticaly shared by all instances but are created for each
704a4b75
VS
19wxHtmlParser instance. The reason is that the handler may contain
20document-specific temporary data used during parsing (e.g. complicated
22d6efa8 21structures like tables).
704a4b75 22
22d6efa8 23Typically the user calls only the \helpref{Parse}{wxhtmlparserparse} method.
704a4b75
VS
24
25\wxheading{Derived from}
26
27wxObject
28
29\wxheading{See also}
30
31\helpref{Cells Overview}{cells},
32\helpref{Tag Handlers Overview}{handlers},
33\helpref{wxHtmlTag}{wxhtmltag}
34
35\latexignore{\rtfignore{\wxheading{Members}}}
36
704a4b75
VS
37\membersection{wxHtmlParser::wxHtmlParser}\label{wxhtmlparserwxhtmlparser}
38
39\func{}{wxHtmlParser}{\void}
40
3660fc40 41Constructor.
704a4b75 42
559fe022 43\membersection{wxHtmlParser::AddTag}\label{wxhtmlparseraddtag}
704a4b75 44
559fe022 45\func{void}{AddTag}{\param{const wxHtmlTag\& }{tag}}
704a4b75 46
559fe022 47This may (and may not) be overwriten in derived class.
704a4b75 48
559fe022
VS
49This method is called each time new tag is about to be added.
50{\it tag} contains information about the tag. (See \helpref{wxHtmlTag}{wxhtmltag}
51for details.)
704a4b75 52
559fe022
VS
53Default (wxHtmlParser) behaviour is this:
54First it finds a handler capable of handling this tag and then it calls
55handler's HandleTag method.
704a4b75 56
559fe022 57\membersection{wxHtmlParser::AddTagHandler}\label{wxhtmlparseraddtaghandler}
704a4b75 58
559fe022 59\func{virtual void}{AddTagHandler}{\param{wxHtmlTagHandler }{*handler}}
704a4b75 60
559fe022
VS
61Adds handler to the internal list (\& hash table) of handlers. This
62method should not be called directly by user but rather by derived class'
63constructor.
704a4b75 64
559fe022
VS
65This adds the handler to this {\bf instance} of wxHtmlParser, not to
66all objects of this class! (Static front-end to AddTagHandler is provided
67by wxHtmlWinParser).
704a4b75 68
559fe022 69All handlers are deleted on object deletion.
704a4b75 70
559fe022 71\membersection{wxHtmlParser::AddText}\label{wxhtmlparseraddword}
704a4b75 72
559fe022 73\func{virtual void}{AddWord}{\param{const char* }{txt}}
704a4b75 74
559fe022 75Must be overwriten in derived class.
704a4b75 76
559fe022
VS
77This method is called by \helpref{DoParsing}{wxhtmlparserdoparsing}
78each time a part of text is parsed. {\it txt} is NOT only one word, it is
79substring of input. It is not formatted or preprocessed (so white spaces are
80unmodified).
704a4b75 81
559fe022 82\membersection{wxHtmlParser::DoParsing}\label{wxhtmlparserdoparsing}
704a4b75 83
559fe022
VS
84\func{void}{DoParsing}{\param{int }{begin\_pos}, \param{int }{end\_pos}}
85
86\func{void}{DoParsing}{\void}
87
88Parses the m\_Source from begin\_pos to end\_pos-1.
89(in noparams version it parses whole m\_Source)
704a4b75 90
704a4b75
VS
91\membersection{wxHtmlParser::DoneParser}\label{wxhtmlparserdoneparser}
92
93\func{virtual void}{DoneParser}{\void}
94
95This must be called after DoParsing().
96
559fe022 97\membersection{wxHtmlParser::GetFS}\label{wxhtmlparsergetfs}
704a4b75 98
559fe022 99\constfunc{wxFileSystem*}{GetFS}{\void}
704a4b75 100
559fe022
VS
101Returns pointer to the file system. Because each tag handler has
102reference to it's parent parser it can easily request the file by
103calling
704a4b75 104
559fe022
VS
105\begin{verbatim}
106wxFSFile *f = m_Parser -> GetFS() -> OpenFile("image.jpg");
107\end{verbatim}
704a4b75
VS
108
109\membersection{wxHtmlParser::GetProduct}\label{wxhtmlparsergetproduct}
110
111\func{virtual wxObject*}{GetProduct}{\void}
112
3660fc40
RD
113Returns product of parsing. Returned value is result of parsing
114of the document. The type of this result depends on internal
704a4b75
VS
115representation in derived parser (but it must be derived from wxObject!).
116
117See wxHtmlWinParser for details.
118
704a4b75
VS
119\membersection{wxHtmlParser::GetSource}\label{wxhtmlparsergetsource}
120
121\func{wxString*}{GetSource}{\void}
122
123Returns pointer to the source being parsed.
124
704a4b75 125
559fe022 126\membersection{wxHtmlParser::InitParser}\label{wxhtmlparserinitparser}
704a4b75 127
559fe022 128\func{virtual void}{InitParser}{\param{const wxString\& }{source}}
704a4b75 129
559fe022
VS
130Setups the parser for parsing the {\it source} string. (Should be overriden
131in derived class)
704a4b75 132
559fe022 133\membersection{wxHtmlParser::Parse}\label{wxhtmlparserparse}
704a4b75 134
559fe022 135\func{wxObject*}{Parse}{\param{const wxString\& }{source}}
704a4b75 136
559fe022
VS
137Proceeds parsing of the document. This is end-user method. You can simply
138call it when you need to obtain parsed output (which is parser-specific)
704a4b75 139
559fe022 140The method does these things:
704a4b75 141
448af9a4 142\begin{enumerate}\itemsep=0pt
559fe022
VS
143\item calls \helpref{InitParser(source)}{wxhtmlparserinitparser}
144\item calls \helpref{DoParsing}{wxhtmlparserdoparsing}
145\item calls \helpref{GetProduct}{wxhtmlparsergetproduct}
146\item calls \helpref{DoneParser}{wxhtmlparserdoneparser}
147\item returns value returned by GetProduct
148\end{enumerate}
704a4b75 149
559fe022
VS
150You shouldn't use InitParser, DoParsing, GetProduct or DoneParser directly.
151
0eb8c938
VS
152
153
154\membersection{wxHtmlParser::PushTagHandler}\label{wxhtmlparserpushtaghandler}
155
156\func{void}{PushTagHandler}{\param{wxHtmlTagHandler* }{handler}, \param{wxString }{tags}}
157
158Forces the handler to handle additional tags
159(not returned by \helpref{GetSupportedTags}{wxhtmltaghandlergetsupportedtags}).
160The handler should already be added to this parser.
161
162\wxheading{Parameters}
163
164\docparam{handler}{the handler}
165\docparam{tags}{List of tags (in same format as GetSupportedTags's return value). The parser
166will redirect these tags to {\it handler} (until call to \helpref{PopTagHandler}{wxhtmlparserpoptaghandler}). }
167
168\wxheading{Example}
169
170Imagine you want to parse following pseudo-html structure:
171
172\begin{verbatim}
173<myitems>
174 <param name="one" value="1">
175 <param name="two" value="2">
176</myitems>
177
178<execute>
179 <param program="text.exe">
180</execute>
181\end{verbatim}
182
183It is obvious that you cannot use only one tag handler for <param> tag.
184Instead you must use context-sensitive handlers for <param> inside <myitems>
185and <param> inside <execute>.
186
187This is the prefered solution:
188
189\begin{verbatim}
190TAG_HANDLER_BEGIN(MYITEM, "MYITEMS")
191 TAG_HANDLER_PROC(tag)
192 {
193 // ...something...
194
195 m_Parser -> PushTagHandler(this, "PARAM");
196 ParseInner(tag);
197 m_Parser -> PopTagHandler();
198
199 // ...something...
200 }
201TAG_HANDLER_END(MYITEM)
202\end{verbatim}
203
204
205\membersection{wxHtmlParser::PopTagHandler}\label{wxhtmlparserpoptaghandler}
206
207\func{void}{PopTagHandler}{\void}
208
209Restores parser's state before last call to
210\helpref{PushTagHandler}{wxhtmlparserpushtaghandler}.
211
212
559fe022
VS
213\membersection{wxHtmlParser::SetFS}\label{wxhtmlparsersetfs}
214
215\func{void}{SetFS}{\param{wxFileSystem }{*fs}}
216
217Sets the virtual file system that will be used to request additional
218files. (For example {\tt <IMG>} tag handler requests wxFSFile with the
219image data.)
22d6efa8 220