]> git.saurik.com Git - apt.git/blob - apt-pkg/contrib/strutl.h
refactor EDSP classes for better internal reuse
[apt.git] / apt-pkg / contrib / strutl.h
1 // -*- mode: cpp; mode: fold -*-
2 // Description /*{{{*/
3 // $Id: strutl.h,v 1.22 2003/02/02 22:20:27 jgg Exp $
4 /* ######################################################################
5
6 String Util - These are some useful string functions
7
8 _strstrip is a function to remove whitespace from the front and end
9 of a string.
10
11 This source is placed in the Public Domain, do with it what you will
12 It was originally written by Jason Gunthorpe <jgg@gpu.srv.ualberta.ca>
13
14 ##################################################################### */
15 /*}}}*/
16 #ifndef STRUTL_H
17 #define STRUTL_H
18
19
20 #include <limits>
21 #include <string>
22 #include <cstring>
23 #include <vector>
24 #include <iostream>
25 #ifdef APT_PKG_EXPOSE_STRING_VIEW
26 #include <apt-pkg/string_view.h>
27 #endif
28 #include <time.h>
29 #include <stddef.h>
30
31 #include "macros.h"
32
33 #ifndef APT_10_CLEANER_HEADERS
34 #include <stdlib.h>
35 #endif
36 #ifndef APT_8_CLEANER_HEADERS
37 using std::string;
38 using std::vector;
39 using std::ostream;
40 #endif
41
42 namespace APT {
43 namespace String {
44 std::string Strip(const std::string &s);
45 bool Endswith(const std::string &s, const std::string &ending);
46 bool Startswith(const std::string &s, const std::string &starting);
47 }
48 }
49
50
51 bool UTF8ToCodeset(const char *codeset, const std::string &orig, std::string *dest);
52 char *_strstrip(char *String);
53 char *_strrstrip(char *String); // right strip only
54 char *_strtabexpand(char *String,size_t Len);
55 bool ParseQuoteWord(const char *&String,std::string &Res);
56 bool ParseCWord(const char *&String,std::string &Res);
57 std::string QuoteString(const std::string &Str,const char *Bad);
58 std::string DeQuoteString(const std::string &Str);
59 std::string DeQuoteString(std::string::const_iterator const &begin, std::string::const_iterator const &end);
60
61 // unescape (\0XX and \xXX) from a string
62 std::string DeEscapeString(const std::string &input);
63
64 std::string SizeToStr(double Bytes);
65 std::string TimeToStr(unsigned long Sec);
66 std::string Base64Encode(const std::string &Str);
67 std::string OutputInDepth(const unsigned long Depth, const char* Separator=" ");
68 std::string URItoFileName(const std::string &URI);
69 std::string TimeRFC1123(time_t Date);
70 /** parses time as needed by HTTP/1.1 and Debian files.
71 *
72 * HTTP/1.1 prefers dates in RFC1123 format (but the other two obsolete date formats
73 * are supported to) and e.g. Release files use the same format in Date & Valid-Until
74 * fields.
75 *
76 * Note: datetime strings need to be in UTC timezones (GMT, UTC, Z, +/-0000) to be
77 * parsed. Other timezones will be rejected as invalid. Previous implementations
78 * accepted other timezones, but treated them as UTC.
79 *
80 * @param str is the datetime string to parse
81 * @param[out] time will be the seconds since epoch of the given datetime if
82 * parsing is successful, undefined otherwise.
83 * @return \b true if parsing was successful, otherwise \b false.
84 */
85 bool RFC1123StrToTime(const char* const str,time_t &time) APT_MUSTCHECK;
86 bool FTPMDTMStrToTime(const char* const str,time_t &time) APT_MUSTCHECK;
87 APT_DEPRECATED_MSG("Use RFC1123StrToTime or FTPMDTMStrToTime as needed instead") bool StrToTime(const std::string &Val,time_t &Result);
88 std::string LookupTag(const std::string &Message,const char *Tag,const char *Default = 0);
89 int StringToBool(const std::string &Text,int Default = -1);
90 bool ReadMessages(int Fd, std::vector<std::string> &List);
91 bool StrToNum(const char *Str,unsigned long &Res,unsigned Len,unsigned Base = 0);
92 bool StrToNum(const char *Str,unsigned long long &Res,unsigned Len,unsigned Base = 0);
93 bool Base256ToNum(const char *Str,unsigned long &Res,unsigned int Len);
94 bool Base256ToNum(const char *Str,unsigned long long &Res,unsigned int Len);
95 bool Hex2Num(const std::string &Str,unsigned char *Num,unsigned int Length);
96 #ifdef APT_PKG_EXPOSE_STRING_VIEW
97 APT_HIDDEN bool Hex2Num(const APT::StringView Str,unsigned char *Num,unsigned int Length);
98 #endif
99 // input changing string split
100 bool TokSplitString(char Tok,char *Input,char **List,
101 unsigned long ListMax);
102
103 // split a given string by a char
104 std::vector<std::string> VectorizeString(std::string const &haystack, char const &split) APT_PURE;
105
106 /* \brief Return a vector of strings from string "input" where "sep"
107 * is used as the delimiter string.
108 *
109 * \param input The input string.
110 *
111 * \param sep The separator to use.
112 *
113 * \param maxsplit (optional) The maximum amount of splitting that
114 * should be done .
115 *
116 * The optional "maxsplit" argument can be used to limit the splitting,
117 * if used the string is only split on maxsplit places and the last
118 * item in the vector contains the remainder string.
119 */
120 std::vector<std::string> StringSplit(std::string const &input,
121 std::string const &sep,
122 unsigned int maxsplit=std::numeric_limits<unsigned int>::max()) APT_CONST;
123
124 void ioprintf(std::ostream &out,const char *format,...) APT_PRINTF(2);
125 void strprintf(std::string &out,const char *format,...) APT_PRINTF(2);
126 char *safe_snprintf(char *Buffer,char *End,const char *Format,...) APT_PRINTF(3);
127 bool CheckDomainList(const std::string &Host, const std::string &List);
128
129 /* Do some compat mumbo jumbo */
130 #define tolower_ascii tolower_ascii_inline
131 #define isspace_ascii isspace_ascii_inline
132
133 APT_CONST APT_HOT
134 static inline int tolower_ascii_inline(int const c)
135 {
136 return (c >= 'A' && c <= 'Z') ? c + 32 : c;
137 }
138 APT_CONST APT_HOT
139 static inline int isspace_ascii_inline(int const c)
140 {
141 // 9='\t',10='\n',11='\v',12='\f',13='\r',32=' '
142 return (c >= 9 && c <= 13) || c == ' ';
143 }
144
145 std::string StripEpoch(const std::string &VerStr);
146
147 #define APT_MKSTRCMP(name,func) \
148 inline APT_PURE int name(const char *A,const char *B) {return func(A,A+strlen(A),B,B+strlen(B));} \
149 inline APT_PURE int name(const char *A,const char *AEnd,const char *B) {return func(A,AEnd,B,B+strlen(B));} \
150 inline APT_PURE int name(const std::string& A,const char *B) {return func(A.c_str(),A.c_str()+A.length(),B,B+strlen(B));} \
151 inline APT_PURE int name(const std::string& A,const std::string& B) {return func(A.c_str(),A.c_str()+A.length(),B.c_str(),B.c_str()+B.length());} \
152 inline APT_PURE int name(const std::string& A,const char *B,const char *BEnd) {return func(A.c_str(),A.c_str()+A.length(),B,BEnd);}
153
154 #define APT_MKSTRCMP2(name,func) \
155 inline APT_PURE int name(const char *A,const char *AEnd,const char *B) {return func(A,AEnd,B,B+strlen(B));} \
156 inline APT_PURE int name(const std::string& A,const char *B) {return func(A.begin(),A.end(),B,B+strlen(B));} \
157 inline APT_PURE int name(const std::string& A,const std::string& B) {return func(A.begin(),A.end(),B.begin(),B.end());} \
158 inline APT_PURE int name(const std::string& A,const char *B,const char *BEnd) {return func(A.begin(),A.end(),B,BEnd);}
159
160 int APT_PURE stringcmp(const char *A,const char *AEnd,const char *B,const char *BEnd);
161 int APT_PURE stringcasecmp(const char *A,const char *AEnd,const char *B,const char *BEnd);
162
163 /* We assume that GCC 3 indicates that libstdc++3 is in use too. In that
164 case the definition of string::const_iterator is not the same as
165 const char * and we need these extra functions */
166 #if __GNUC__ >= 3
167 int APT_PURE stringcmp(std::string::const_iterator A,std::string::const_iterator AEnd,
168 const char *B,const char *BEnd);
169 int APT_PURE stringcmp(std::string::const_iterator A,std::string::const_iterator AEnd,
170 std::string::const_iterator B,std::string::const_iterator BEnd);
171 int APT_PURE stringcasecmp(std::string::const_iterator A,std::string::const_iterator AEnd,
172 const char *B,const char *BEnd);
173 int APT_PURE stringcasecmp(std::string::const_iterator A,std::string::const_iterator AEnd,
174 std::string::const_iterator B,std::string::const_iterator BEnd);
175
176 inline APT_PURE int stringcmp(std::string::const_iterator A,std::string::const_iterator Aend,const char *B) {return stringcmp(A,Aend,B,B+strlen(B));}
177 inline APT_PURE int stringcasecmp(std::string::const_iterator A,std::string::const_iterator Aend,const char *B) {return stringcasecmp(A,Aend,B,B+strlen(B));}
178 #endif
179
180 APT_MKSTRCMP2(stringcmp,stringcmp)
181 APT_MKSTRCMP2(stringcasecmp,stringcasecmp)
182
183 // Return the length of a NULL-terminated string array
184 size_t APT_PURE strv_length(const char **str_array);
185
186
187 inline const char *DeNull(const char *s) {return (s == 0?"(null)":s);}
188
189 class URI
190 {
191 void CopyFrom(const std::string &From);
192
193 public:
194
195 std::string Access;
196 std::string User;
197 std::string Password;
198 std::string Host;
199 std::string Path;
200 unsigned int Port;
201
202 operator std::string();
203 inline void operator =(const std::string &From) {CopyFrom(From);}
204 inline bool empty() {return Access.empty();};
205 static std::string SiteOnly(const std::string &URI);
206 static std::string ArchiveOnly(const std::string &URI);
207 static std::string NoUserPassword(const std::string &URI);
208
209 URI(std::string Path) {CopyFrom(Path);}
210 URI() : Port(0) {}
211 };
212
213 struct SubstVar
214 {
215 const char *Subst;
216 const std::string *Contents;
217 };
218 std::string SubstVar(std::string Str,const struct SubstVar *Vars);
219 std::string SubstVar(const std::string &Str,const std::string &Subst,const std::string &Contents);
220
221 struct RxChoiceList
222 {
223 void *UserData;
224 const char *Str;
225 bool Hit;
226 };
227 unsigned long RegexChoice(RxChoiceList *Rxs,const char **ListBegin,
228 const char **ListEnd);
229
230 #endif