* debian/rules:

[apt.git] / apt-pkg / contrib / strutl.cc
diff --git a/apt-pkg/contrib/strutl.cc b/apt-pkg/contrib/strutl.cc

index 2913fbf44e42f74bf8104cb5b97051816c0940d7..c7d63ce8a58f069e55e05f920b5c003d9519f127 100644 (file)
--- a/apt-pkg/contrib/strutl.cc
+++ b/apt-pkg/contrib/strutl.cc
@@ -198,7 +198,8 @@ bool ParseQuoteWord(const char *&String,string &Res)
     char *I;
     for (I = Buffer; I < Buffer + sizeof(Buffer) && Start != C; I++)
     {
-      if (*Start == '%' && Start + 2 < C)
+      if (*Start == '%' && Start + 2 < C &&
+         isxdigit(Start[1]) && isxdigit(Start[2]))
        {
          Tmp[0] = Start[1];
          Tmp[1] = Start[2];
@@ -273,7 +274,8 @@ string QuoteString(const string &Str, const char *Bad)
     for (string::const_iterator I = Str.begin(); I != Str.end(); I++)
     {
        if (strchr(Bad,*I) != 0 || isprint(*I) == 0 || 
-         *I <= 0x20 || *I >= 0x7F)
+         *I == 0x25 || // percent '%' char
+         *I <= 0x20 || *I >= 0x7F) // control chars
        {
          char Buf[10];
          sprintf(Buf,"%%%02x",(int)*I);
@@ -289,11 +291,17 @@ string QuoteString(const string &Str, const char *Bad)
  // ---------------------------------------------------------------------
  /* This undoes QuoteString */
  string DeQuoteString(const string &Str)
+{
+   return DeQuoteString(Str.begin(),Str.end()); // forward to the iterator-range overload
+}
+string DeQuoteString(string::const_iterator const &begin,
+                       string::const_iterator const &end)
  {
     string Res;
-   for (string::const_iterator I = Str.begin(); I != Str.end(); I++)
+   for (string::const_iterator I = begin; I != end; I++)
     {
-      if (*I == '%' && I + 2 < Str.end())
+      if (*I == '%' && I + 2 < end &&
+         isxdigit(I[1]) && isxdigit(I[2]))
        {
          char Tmp[3];
          Tmp[0] = I[1];
@@ -566,7 +574,7 @@ int stringcmp(string::const_iterator A,string::const_iterator AEnd,
  int stringcasecmp(const char *A,const char *AEnd,const char *B,const char *BEnd)
  {
     for (; A != AEnd && B != BEnd; A++, B++)
-      if (toupper(*A) != toupper(*B))
+      if (tolower_ascii(*A) != tolower_ascii(*B))
          break;
  
     if (A == AEnd && B == BEnd)
@@ -575,7 +583,7 @@ int stringcasecmp(const char *A,const char *AEnd,const char *B,const char *BEnd)
        return 1;
     if (B == BEnd)
        return -1;
-   if (toupper(*A) < toupper(*B))
+   if (tolower_ascii(*A) < tolower_ascii(*B))
        return -1;
     return 1;
  }
@@ -584,7 +592,7 @@ int stringcasecmp(string::const_iterator A,string::const_iterator AEnd,
                   const char *B,const char *BEnd)
  {
     for (; A != AEnd && B != BEnd; A++, B++)
-      if (toupper(*A) != toupper(*B))
+      if (tolower_ascii(*A) != tolower_ascii(*B))
          break;
  
     if (A == AEnd && B == BEnd)
@@ -593,7 +601,7 @@ int stringcasecmp(string::const_iterator A,string::const_iterator AEnd,
        return 1;
     if (B == BEnd)
        return -1;
-   if (toupper(*A) < toupper(*B))
+   if (tolower_ascii(*A) < tolower_ascii(*B))
        return -1;
     return 1;
  }
@@ -601,7 +609,7 @@ int stringcasecmp(string::const_iterator A,string::const_iterator AEnd,
                   string::const_iterator B,string::const_iterator BEnd)
  {
     for (; A != AEnd && B != BEnd; A++, B++)
-      if (toupper(*A) != toupper(*B))
+      if (tolower_ascii(*A) != tolower_ascii(*B))
          break;
  
     if (A == AEnd && B == BEnd)
@@ -610,7 +618,7 @@ int stringcasecmp(string::const_iterator A,string::const_iterator AEnd,
        return 1;
     if (B == BEnd)
        return -1;
-   if (toupper(*A) < toupper(*B))
+   if (tolower_ascii(*A) < tolower_ascii(*B))
        return -1;
     return 1;
  }
@@ -789,28 +797,28 @@ bool ReadMessages(int Fd, vector<string> &List)
  // MonthConv - Converts a month string into a number                   /*{{{*/
  // ---------------------------------------------------------------------
  /* This was lifted from the boa webserver which lifted it from 'wn-v1.07'
-   Made it a bit more robust with a few touppers though. */
+   Made it a bit more robust with a few tolower_ascii though. */
  static int MonthConv(char *Month)
  {
-   switch (toupper(*Month)) 
+   switch (tolower_ascii(*Month)) 
     {
-      case 'A':
-      return toupper(Month[1]) == 'P'?3:7;
-      case 'D':
+      case 'a':
+      return tolower_ascii(Month[1]) == 'p'?3:7;
+      case 'd':
        return 11;
-      case 'F':
+      case 'f':
        return 1;
-      case 'J':
-      if (toupper(Month[1]) == 'A')
+      case 'j':
+      if (tolower_ascii(Month[1]) == 'a')
          return 0;
-      return toupper(Month[2]) == 'N'?5:6;
-      case 'M':
-      return toupper(Month[2]) == 'R'?2:4;
-      case 'N':
+      return tolower_ascii(Month[2]) == 'n'?5:6;
+      case 'm':
+      return tolower_ascii(Month[2]) == 'r'?2:4;
+      case 'n':
        return 10;
-      case 'O':
+      case 'o':
        return 9;
-      case 'S':
+      case 's':
        return 8;
  
        // Pretend it is January..
@@ -1000,6 +1008,24 @@ bool TokSplitString(char Tok,char *Input,char **List,
     return true;
  }
                                                                         /*}}}*/
+// VectorizeString - Split a string up into a vector of strings                /*{{{*/
+// ---------------------------------------------------------------------
+/* Splits haystack at every split char into an iterable vector (a bit
+   slower than the method above). An empty haystack gives one empty
+   string; a split char at the very end adds no trailing empty string. */
+vector<string> VectorizeString(string const &haystack, char const &split)
+{
+   string::const_iterator start = haystack.begin();
+   string::const_iterator end = start;
+   vector<string> exploded;
+   do {
+      for (; end != haystack.end() && *end != split; ++end);
+      exploded.push_back(string(start, end));
+      start = (end == haystack.end()) ? end : ++end; // skip split, never step past end()
+   } while (end != haystack.end());
+   return exploded;
+}
+                                                                       /*}}}*/
  // RegexChoice - Simple regex list/list matcher                                /*{{{*/
  // ---------------------------------------------------------------------
  /* */
@@ -1115,10 +1141,13 @@ char *safe_snprintf(char *Buffer,char *End,const char *Format,...)
  
  // tolower_ascii - tolower() function that ignores the locale          /*{{{*/
  // ---------------------------------------------------------------------
-/* */
-int tolower_ascii(int c)
+/* This little function is the most called method we have and tries
+   therefore to do the absolute minimum - and is noticeably faster than
+   standard tolower/toupper and as a bonus avoids problems with different
+   locales - we only operate on ascii chars anyway. */
+int tolower_ascii(int const c)
  {
-   if (c >= 'A' and c <= 'Z')
+   if (c >= 'A' && c <= 'Z')
        return c + 32;
     return c;
  }
@@ -1217,9 +1246,10 @@ void URI::CopyFrom(const string &U)
     else
     {
        Host.assign(At+1,SingleSlash);
-      User.assign(FirstColon,SecondColon);
+      // username and password must be encoded (RFC 3986)
+      User.assign(DeQuoteString(FirstColon,SecondColon));
        if (SecondColon < At)
-        Password.assign(SecondColon+1,At);
+        Password.assign(DeQuoteString(SecondColon+1,At));
     }   
     
     // Now we parse the RFC 2732 [] hostnames.
@@ -1323,3 +1353,15 @@ string URI::SiteOnly(const string &URI)
     return U;
  }
                                                                         /*}}}*/
+// URI::NoUserPassword - Return the schema, site and path for the URI  /*{{{*/
+// ---------------------------------------------------------------------
+/* Parses the given URI, clears User and Password, sets Port to 0 and returns it as string */
+string URI::NoUserPassword(const string &URI)
+{
+   ::URI U(URI);
+   U.User.clear();
+   U.Password.clear();
+   U.Port = 0; // NOTE(review): the port is dropped as well - confirm this is intended
+   return U;
+}
+                                                                       /*}}}*/