]> git.saurik.com Git - wxWidgets.git/blame - docs/latex/wx/regex.tex
Applied patch [ 581139 ] Misc wxCmdLineParser changes/fixes
[wxWidgets.git] / docs / latex / wx / regex.tex
CommitLineData
11ec1f16
VZ
1%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
2%% Name: regex.tex
3%% Purpose: wxRegEx documentation
4%% Author: Vadim Zeitlin
5%% Modified by:
6%% Created: 14.07.01
7%% RCS-ID: $Id$
8%% Copyright: (c) 2001 Vadim Zeitlin
9%% License: wxWindows license
10%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
11
12\section{\class{wxRegEx}}\label{wxregex}
13
14wxRegEx represents a regular expression. The regular expressions syntax
15supported is the POSIX one. Both basic and extended regular expressions are
16supported but, unlike POSIX C API, the extended ones are used by default.
17
18This class provides support for regular expressions matching and also
19replacement. It is built on top of either the system library (if it has support
20for POSIX regular expressions - which is the case of the most modern Unices) or
21uses the built in Henry Spencer's library. In the latter case you need to abide
22by the terms of its copyright:
23
24\begin{verbatim}
25Copyright 1992, 1993, 1994, 1997 Henry Spencer. All rights reserved.
26This software is not subject to any license of the American Telephone
27and Telegraph Company or of the Regents of the University of California.
28
29Permission is granted to anyone to use this software for any purpose on
30any computer system, and to alter it and redistribute it, subject
31to the following restrictions:
32
331. The author is not responsible for the consequences of use of this
34 software, no matter how awful, even if they arise from flaws in it.
35
362. The origin of this software must not be misrepresented, either by
37 explicit claim or by omission. Since few users ever read sources,
38 credits must appear in the documentation.
39
403. Altered versions must be plainly marked as such, and must not be
41 misrepresented as being the original software. Since few users
42 ever read sources, credits must appear in the documentation.
43
444. This notice may not be removed or altered.
45\end{verbatim}
46
47\wxheading{Derived from}
48
49No base class
50
51\wxheading{Data structures}
52
53Flags for regex compilation to be used with \helpref{Compile()}{wxregexcompile}:
5ef298b3 54
11ec1f16
VZ
55\begin{verbatim}
56enum
57{
58 // use extended regex syntax (default)
a43e748a 59 wxRE_EXTENDED = 0,
11ec1f16
VZ
60
61 // use basic RE syntax
a43e748a 62 wxRE_BASIC = 2,
11ec1f16
VZ
63
64 // ignore case in match
a43e748a 65 wxRE_ICASE = 4,
11ec1f16
VZ
66
67 // only check match, don't set back references
a43e748a 68 wxRE_NOSUB = 8,
11ec1f16
VZ
69
70 // if not set, treat '\n' as an ordinary character, otherwise it is
71 // special: it is not matched by '.' and '^' and '$' always match
a43e748a
GT
72 // after/before it regardless of the setting of wxRE_NOT[BE]OL
73 wxRE_NEWLINE = 16,
11ec1f16
VZ
74
75 // default flags
a43e748a 76 wxRE_DEFAULT = wxRE_EXTENDED
11ec1f16
VZ
77}
78\end{verbatim}
79
80Flags for regex matching to be used with \helpref{Matches()}{wxregexmatches}.
81
82These flags are mainly useful when doing several matches in a long string
7af3ca16 83to prevent erroneous matches for {\tt '\textasciicircum'} and {\tt '\$'}:
5ef298b3 84
11ec1f16
VZ
85\begin{verbatim}
86enum
87{
88 // '^' doesn't match at the start of line
a43e748a 89 wxRE_NOTBOL = 32,
11ec1f16
VZ
90
91 // '$' doesn't match at the end of line
a43e748a 92 wxRE_NOTEOL = 64
11ec1f16
VZ
93}
94\end{verbatim}
95
5ef298b3
VZ
96\wxheading{Examples}
97
98A bad example of processing some text containing email addresses (the example
99is bad because the real email addresses can have more complicated form than
100{\tt user@host.net}):
101
102\begin{verbatim}
103wxString text;
104...
105wxRegEx reEmail = "([^@]+)@([[:alnum:].-_].)+([[:alnum:]]+)";
106if ( reEmail.Matches(text) )
107{
108 wxString text = reEmail.GetMatch(email);
109 wxString username = reEmail.GetMatch(email, 1);
110 if ( reEmail.GetMatch(email, 3) == "com" ) // .com TLD?
111 {
112 ...
113 }
114}
115
116// or we could do this to hide the email address
117size_t count = reEmail.ReplaceAll(text, "HIDDEN@\\2\\3");
118printf("text now contains %u hidden addresses", count);
119\end{verbatim}
120
11ec1f16
VZ
121\latexignore{\rtfignore{\wxheading{Members}}}
122
123\membersection{wxRegEx::wxRegEx}\label{wxregexwxregex}
124
125\func{}{wxRegEx}{\void}
126
127Default ctor: use \helpref{Compile()}{wxregexcompile} later.
128
11ec1f16
VZ
129\func{}{wxRegEx}{\param{const wxString\& }{expr}, \param{int }{flags = wxRE\_DEFAULT}}
130
131Create and compile the regular expression, use
132\helpref{IsValid}{wxregexisvalid} to test for compilation errors.
133
134\membersection{wxRegEx::\destruct{wxRegEx}}\label{wxregexdtor}
135
136\func{}{\destruct{wxRegEx}}{\void}
137
138dtor not virtual, don't derive from this class
139
140\membersection{wxRegEx::Compile}\label{wxregexcompile}
141
142\func{bool}{Compile}{\param{const wxString\& }{pattern}, \param{int }{flags = wxRE\_DEFAULT}}
143
5ef298b3 144Compile the string into regular expression, return {\tt TRUE} if ok or {\tt FALSE}
11ec1f16
VZ
145if string has a syntax error.
146
147\membersection{wxRegEx::IsValid}\label{wxregexisvalid}
148
149\constfunc{bool}{IsValid}{\void}
150
151Return {\tt TRUE} if this is a valid compiled regular expression, {\tt FALSE}
152otherwise.
153
154\membersection{wxRegEx::GetMatch}\label{wxregexgetmatch}
155
156\constfunc{bool}{GetMatch}{\param{size\_t* }{start}, \param{size\_t* }{len}, \param{size\_t }{index = 0}}
157
158Get the start index and the length of the match of the expression
159(if {\it index} is $0$) or a bracketed subexpression ({\it index} different
160from $0$).
161
162May only be called after successful call to \helpref{Matches()}{wxregexmatches}
163and only if {\tt wxRE\_NOSUB} was {\bf not} used in
164\helpref{Compile()}{wxregexcompile}.
165
166Returns {\tt FALSE} if no match or if an error occured.
167
168\constfunc{wxString}{GetMatch}{\param{const wxString\& }{text}, \param{size\_t }{index = 0}}
169
170Returns the part of string corresponding to the match where {\it index} is
171interpreted as above. Empty string is returned if match failed
172
173May only be called after successful call to \helpref{Matches()}{wxregexmatches}
174and only if {\tt wxRE\_NOSUB} was {\bf not} used in
175\helpref{Compile()}{wxregexcompile}.
176
177\membersection{wxRegEx::Matches}\label{wxregexmatches}
178
179\constfunc{bool}{Matches}{\param{const wxChar* }{text}, \param{int }{flags = 0}}
180
181Matches the precompiled regular expression against the string {\it text},
182returns {\tt TRUE} if matches and {\tt FALSE} otherwise.
183
184Flags may be combination of {\tt wxRE\_NOTBOL} and {\tt wxRE\_NOTEOL}.
185
186May only be called after successful call to \helpref{Compile()}{wxregexcompile}.
187
188\membersection{wxRegEx::Replace}\label{wxregexreplace}
189
190\constfunc{int}{Replace}{\param{wxString* }{text}, \param{const wxString\& }{replacement}, \param{size\_t }{maxMatches = 0}}
191
192Replaces the current regular expression in the string pointed to by
193{\it text}, with the text in {\it replacement} and return number of matches
194replaced (maybe $0$ if none found) or $-1$ on error.
195
6465d401 196The replacement text may contain back references {\tt $\backslash$number} which will be
11ec1f16 197replaced with the value of the corresponding subexpression in the
6465d401 198pattern match. {\tt $\backslash$0} corresponds to the entire match and {\tt \&} is a
11ec1f16
VZ
199synonym for it. Backslash may be used to quote itself or {\tt \&} character.
200
201{\it maxMatches} may be used to limit the number of replacements made, setting
2edb0bde 202it to $1$, for example, will only replace first occurrence (if any) of the
11ec1f16
VZ
203pattern in the text while default value of $0$ means replace all.
204
205\membersection{wxRegEx::ReplaceAll}\label{wxregexreplaceall}
206
207\constfunc{int}{ReplaceAll}{\param{wxString* }{text}, \param{const wxString\& }{replacement}}
208
2edb0bde 209Replace all occurrences: this is actually a synonym for
11ec1f16
VZ
210\helpref{Replace()}{wxregexreplace}.
211
212\wxheading{See also}
213
214\helpref{ReplaceFirst}{wxregexreplacefirst}
215
216\membersection{wxRegEx::ReplaceFirst}\label{wxregexreplacefirst}
217
218\constfunc{int}{ReplaceFirst}{\param{wxString* }{text}, \param{const wxString\& }{replacement}}
219
2edb0bde 220Replace the first occurrence.
11ec1f16
VZ
221
222\wxheading{See also}
223
224\helpref{Replace}{wxregexreplace}
225