git.saurik.com Git - wxWidgets.git/blame_incremental

... / ...

Commit	Line	Data
	1	/////////////////////////////////////////////////////////////////////////////
	2	// Name: wx/tokenzr.h
	3	// Purpose: String tokenizer - a C++ replacement for strtok(3)
	4	// Author: Guilhem Lavaux
	5	// Modified by: (or rather rewritten by) Vadim Zeitlin
	6	// Created: 04/22/98
	7	// RCS-ID: $Id$
	8	// Copyright: (c) Guilhem Lavaux
	9	// Licence: wxWindows licence
	10	/////////////////////////////////////////////////////////////////////////////
	11
	12	#ifndef _WX_TOKENZRH
	13	#define _WX_TOKENZRH
	14
	15	#include "wx/object.h"
	16	#include "wx/string.h"
	17	#include "wx/arrstr.h"
	18
	19	// ----------------------------------------------------------------------------
	20	// constants
	21	// ----------------------------------------------------------------------------
	22
	23	// default: delimiters are usual white space characters
	24	#define wxDEFAULT_DELIMITERS (_T(" \t\r\n"))
	25
	26	// wxStringTokenizer mode flags which determine its behaviour
	27	enum wxStringTokenizerMode
	28	{
	29	wxTOKEN_INVALID = -1, // set by def ctor until SetString() is called
	30	wxTOKEN_DEFAULT, // strtok() for whitespace delims, RET_EMPTY else
	31	wxTOKEN_RET_EMPTY, // return empty token in the middle of the string
	32	wxTOKEN_RET_EMPTY_ALL, // return trailing empty tokens too
	33	wxTOKEN_RET_DELIMS, // return the delim with token (implies RET_EMPTY)
	34	wxTOKEN_STRTOK // behave exactly like strtok(3)
	35	};
	36
	37	// ----------------------------------------------------------------------------
	38	// wxStringTokenizer: replaces infamous strtok() and has some other features
	39	// ----------------------------------------------------------------------------
	40
	41	class WXDLLIMPEXP_BASE wxStringTokenizer : public wxObject
	42	{
	43	public:
	44	// ctors and initializers
	45	// default ctor, call SetString() later
	46	wxStringTokenizer() { m_mode = wxTOKEN_INVALID; }
	47	// ctor which gives us the string
	48	wxStringTokenizer(const wxString& str,
	49	const wxString& delims = wxDEFAULT_DELIMITERS,
	50	wxStringTokenizerMode mode = wxTOKEN_DEFAULT);
	51
	52	// args are same as for the non default ctor above
	53	void SetString(const wxString& str,
	54	const wxString& delims = wxDEFAULT_DELIMITERS,
	55	wxStringTokenizerMode mode = wxTOKEN_DEFAULT);
	56
	57	// reinitialize the tokenizer with the same delimiters/mode
	58	void Reinit(const wxString& str);
	59
	60	// tokens access
	61	// return the number of remaining tokens
	62	size_t CountTokens() const;
	63	// did we reach the end of the string?
	64	bool HasMoreTokens() const;
	65	// get the next token, will return empty string if !HasMoreTokens()
	66	wxString GetNextToken();
	67	// get the delimiter which terminated the token last retrieved by
	68	// GetNextToken() or NUL if there had been no tokens yet or the last
	69	// one wasn't terminated (but ran to the end of the string)
	70	wxChar GetLastDelimiter() const { return m_lastDelim; }
	71
	72	// get current tokenizer state
	73	// returns the part of the string which remains to tokenize (not the
	74	// initial string)
	75	wxString GetString() const { return wxString(m_pos, m_string.end()); }
	76
	77	// returns the current position (i.e. one index after the last
	78	// returned token or 0 if GetNextToken() has never been called) in the
	79	// original string
	80	size_t GetPosition() const { return m_pos - m_string.begin(); }
	81
	82	// misc
	83	// get the current mode - can be different from the one passed to the
	84	// ctor if it was wxTOKEN_DEFAULT
	85	wxStringTokenizerMode GetMode() const { return m_mode; }
	86	// do we return empty tokens?
	87	bool AllowEmpty() const { return m_mode != wxTOKEN_STRTOK; }
	88
	89
	90	// backwards compatibility section from now on
	91	// -------------------------------------------
	92
	93	// for compatibility only, use GetNextToken() instead
	94	wxString NextToken() { return GetNextToken(); }
	95
	96	// compatibility only, don't use
	97	void SetString(const wxString& to_tokenize,
	98	const wxString& delims,
	99	bool WXUNUSED(ret_delim))
	100	{
	101	SetString(to_tokenize, delims, wxTOKEN_RET_DELIMS);
	102	}
	103
	104	wxStringTokenizer(const wxString& to_tokenize,
	105	const wxString& delims,
	106	bool ret_delim)
	107	{
	108	SetString(to_tokenize, delims, ret_delim);
	109	}
	110
	111	protected:
	112	bool IsOk() const { return m_mode != wxTOKEN_INVALID; }
	113
	114	bool DoHasMoreTokens() const;
	115
	116	enum MoreTokensState
	117	{
	118	MoreTokens_Unknown,
	119	MoreTokens_Yes,
	120	MoreTokens_No
	121	};
	122
	123	MoreTokensState m_hasMoreTokens;
	124
	125	wxString m_string; // the string we tokenize
	126	wxString::const_iterator m_stringEnd;
	127	// FIXME-UTF8: use wxWcharBuffer
	128	wxWxCharBuffer m_delims; // all possible delimiters
	129	size_t m_delimsLen;
	130
	131	wxString::const_iterator m_pos; // the current position in m_string
	132
	133	wxStringTokenizerMode m_mode; // see wxTOKEN_XXX values
	134
	135	wxChar m_lastDelim; // delimiter after last token or '\0'
	136	};
	137
	138	// ----------------------------------------------------------------------------
	139	// convenience function which returns all tokens at once
	140	// ----------------------------------------------------------------------------
	141
	142	// the function takes the same parameters as wxStringTokenizer ctor and returns
	143	// the array containing all tokens
	144	wxArrayString WXDLLIMPEXP_BASE
	145	wxStringTokenize(const wxString& str,
	146	const wxString& delims = wxDEFAULT_DELIMITERS,
	147	wxStringTokenizerMode mode = wxTOKEN_DEFAULT);
	148
	149	#endif // _WX_TOKENZRH