]> git.saurik.com Git - wxWidgets.git/blame - interface/wx/tokenzr.h
add SetCharIncludes and SetCharExcludes utilities to wxTextValidator; use iterators...
[wxWidgets.git] / interface / wx / tokenzr.h
CommitLineData
23324ae1
FM
1/////////////////////////////////////////////////////////////////////////////
2// Name: tokenzr.h
e54c96f1 3// Purpose: interface of wxStringTokenizer
23324ae1
FM
4// Author: wxWidgets team
5// RCS-ID: $Id$
6// Licence: wxWindows license
7/////////////////////////////////////////////////////////////////////////////
8
977cf110
BP
9/**
10 The behaviour of wxStringTokenizer is governed by the @e mode parameter
11 passed to wxStringTokenizer::wxStringTokenizer() or
12 wxStringTokenizer::SetString(), which may be one of the following:
13*/
14enum wxStringTokenizerMode
15{
16 wxTOKEN_INVALID = -1, ///< Invalid tokenizer mode.
17
18 /**
19 Default behaviour: wxStringTokenizer will behave in the same way as
20 @c strtok() (::wxTOKEN_STRTOK) if the delimiters string only contains
21 white space characters but, unlike the standard function, it will
22 behave like ::wxTOKEN_RET_EMPTY, returning empty tokens if this is not
23 the case. This is helpful for parsing strictly formatted data where
24 the number of fields is fixed but some of them may be empty (e.g.
25 @c TAB or comma delimited text files).
26 */
27 wxTOKEN_DEFAULT,
28
29 /**
30 In this mode, the empty tokens in the middle of the string will be returned,
31 i.e. @c "a::b:" will be tokenized in three tokens @c 'a', @c '' and @c 'b'. Notice
32 that all trailing delimiters are ignored in this mode, not just the last one,
33 i.e. a string @c "a::b::" would still result in the same set of tokens.
34 */
35 wxTOKEN_RET_EMPTY,
36
37 /**
38 In this mode, empty trailing tokens (including the one after the last delimiter
39 character) will be returned as well. The string @c "a::b:" will be tokenized in
40 four tokens: the three returned in ::wxTOKEN_RET_EMPTY mode plus a trailing empty
41 one, and a string @c "a::b::" will have five tokens.
42 */
43 wxTOKEN_RET_EMPTY_ALL,
44
45 /**
46 In this mode, the delimiter character after the end of the current token (there
47 may be none if this is the last token) is returned appended to the token.
48 Otherwise, it is the same mode as ::wxTOKEN_RET_EMPTY. Notice that there is no
49 mode like this one but behaving like ::wxTOKEN_RET_EMPTY_ALL instead of
50 ::wxTOKEN_RET_EMPTY, use ::wxTOKEN_RET_EMPTY_ALL and
51 wxStringTokenizer::GetLastDelimiter() to emulate it.
52 */
53 wxTOKEN_RET_DELIMS,
54
55 /**
56 In this mode the class behaves exactly like the standard @c strtok() function:
57 the empty tokens are never returned.
58 */
59 wxTOKEN_STRTOK
60};
61
23324ae1
FM
62/**
63 @class wxStringTokenizer
7c913512 64
977cf110
BP
65 wxStringTokenizer helps you to break a string up into a number of tokens.
66 It replaces the standard C function @c strtok() and also extends it in a
23324ae1 67 number of ways.
7c913512 68
23324ae1
FM
69 To use this class, you should create a wxStringTokenizer object, give it the
70 string to tokenize and also the delimiters which separate tokens in the string
71 (by default, white space characters will be used).
7c913512 72
977cf110
BP
73 Then wxStringTokenizer::GetNextToken() may be called repeatedly until
74 wxStringTokenizer::HasMoreTokens() returns @false.
7c913512 75
23324ae1 76 For example:
7c913512 77
23324ae1 78 @code
977cf110
BP
79 wxStringTokenizer tokenizer("first:second:third:fourth", ":");
80 while ( tokenizer.HasMoreTokens() )
23324ae1 81 {
977cf110 82 wxString token = tokenizer.GetNextToken();
7c913512 83
23324ae1
FM
84 // process token here
85 }
86 @endcode
7c913512 87
23324ae1
FM
88 @library{wxbase}
89 @category{data}
7c913512 90
e54c96f1 91 @see wxStringTokenize()
23324ae1
FM
92*/
93class wxStringTokenizer : public wxObject
94{
95public:
23324ae1 96 /**
977cf110
BP
97 Default constructor. You must call SetString() before calling any other
98 methods.
23324ae1
FM
99 */
100 wxStringTokenizer();
977cf110
BP
101 /**
102 Constructor. Pass the string to tokenize, a string containing
103 delimiters, and the @a mode specifying how the string should be
104 tokenized.
105
106 @see SetString()
107 */
7c913512
FM
108 wxStringTokenizer(const wxString& str,
109 const wxString& delims = " \t\r\n",
110 wxStringTokenizerMode mode = wxTOKEN_DEFAULT);
23324ae1
FM
111
112 /**
977cf110
BP
113 Returns the number of tokens remaining in the input string. The number
114 of tokens returned by this function is decremented each time
115 GetNextToken() is called and when it reaches 0, HasMoreTokens()
116 returns @false.
23324ae1 117 */
43c48e1e 118 size_t CountTokens() const;
23324ae1
FM
119
120 /**
7c913512 121 Returns the delimiter which ended the scan for the last token returned by
977cf110
BP
122 GetNextToken(), or @c NUL if GetNextToken() has not been called yet
123 or if it returned the trailing empty token in
124 ::wxTOKEN_RET_EMPTY_ALL mode.
3c4f71cc 125
1e24c2af 126 @since 2.7.0
23324ae1 127 */
adaaa686 128 wxChar GetLastDelimiter() const;
23324ae1
FM
129
130 /**
131 Returns the next token or an empty string if the end of the string was reached.
132 */
adaaa686 133 wxString GetNextToken();
23324ae1
FM
134
135 /**
136 Returns the current position (i.e. one index after the last returned
137 token or 0 if GetNextToken() has never been called) in the original
138 string.
139 */
328f5751 140 size_t GetPosition() const;
23324ae1
FM
141
142 /**
143 Returns the part of the starting string that remains once all already extracted tokens are removed.
144 */
328f5751 145 wxString GetString() const;
23324ae1
FM
146
147 /**
148 Returns @true if the tokenizer has further tokens, @false if none are left.
149 */
328f5751 150 bool HasMoreTokens() const;
23324ae1
FM
151
152 /**
977cf110
BP
153 Initializes the tokenizer. Pass the string to tokenize, a string
154 containing delimiters, and the @a mode specifying how the string
155 should be tokenized.
23324ae1
FM
156 */
157 void SetString(const wxString& to_tokenize,
158 const wxString& delims = " \t\r\n",
159 wxStringTokenizerMode mode = wxTOKEN_DEFAULT);
160};