src/html/htmltag.cpp

   1 /////////////////////////////////////////////////////////////////////////////
   2 // Name:        htmltag.cpp
   3 // Purpose:     wxHtmlTag class (represents single tag)
   4 // Author:      Vaclav Slavik
   5 // RCS-ID:      $Id$
   6 // Copyright:   (c) 1999 Vaclav Slavik
   7 // Licence:     wxWindows Licence
   8 /////////////////////////////////////////////////////////////////////////////
   9
  10
  11 #ifdef __GNUG__
  12 #pragma implementation
  13 #endif
  14
  15 #include "wx/wxprec.h"
  16
  17 #include "wx/defs.h"
  18 #if wxUSE_HTML
  19
  20 #ifdef __BORDLANDC__
  21 #pragma hdrstop
  22 #endif
  23
  24 #ifndef WXPRECOMP
  25 #include "wx/wx.h"
  26 #endif
  27
  28 #include "wx/html/htmltag.h"
  29 #include "wx/html/htmlpars.h"
  30 #include <stdio.h> // for vsscanf
  31 #include <stdarg.h>
  32
  33
  34 //-----------------------------------------------------------------------------
  35 // wxHtmlTagsCache
  36 //-----------------------------------------------------------------------------
  37
  38 struct wxHtmlCacheItem
  39 {
  40     // this is "pos" value passed to wxHtmlTag's constructor.
  41     // it is position of '<' character of the tag
  42     int Key;
  43
  44     // end positions for the tag:
  45     // end1 is '<' of ending tag,
  46     // end2 is '>' or both are
  47     // -1 if there is no ending tag for this one...
  48     // or -2 if this is ending tag  </...>
  49     int End1, End2;
  50
  51     // name of this tag
  52     wxChar *Name;
  53 };
  54
  55
  56 IMPLEMENT_CLASS(wxHtmlTagsCache,wxObject)
  57
  58 #define CACHE_INCREMENT  64
  59
  60 wxHtmlTagsCache::wxHtmlTagsCache(const wxString& source)
  61 {
  62     const wxChar *src = source.c_str();
  63     int i, tg, pos, stpos;
  64     int lng = source.Length();
  65     wxChar dummy[256];
  66
  67     m_Cache = NULL;
  68     m_CacheSize = 0;
  69     m_CachePos = 0;
  70
  71     pos = 0;
  72     while (pos < lng)
  73     {
  74         if (src[pos] == wxT('<'))   // tag found:
  75         {
  76             if (m_CacheSize % CACHE_INCREMENT == 0)
  77                 m_Cache = (wxHtmlCacheItem*) realloc(m_Cache, (m_CacheSize + CACHE_INCREMENT) * sizeof(wxHtmlCacheItem));
  78             tg = m_CacheSize++;
  79             m_Cache[tg].Key = stpos = pos++;
  80             dummy[0] = 0; i = 0;
  81             while (pos < lng &&
  82                    src[pos] != wxT('>') &&
  83                    src[pos] != wxT(' ') && src[pos] != wxT('\r') &&
  84                    src[pos] != wxT('\n') && src[pos] != wxT('\t'))
  85             {
  86                 dummy[i] = src[pos++];
  87                 if ((dummy[i] >= wxT('a')) && (dummy[i] <= wxT('z'))) dummy[i] -= (wxT('a') - wxT('A'));
  88                 i++;
  89             }
  90             dummy[i] = 0;
  91             m_Cache[tg].Name = new wxChar[i+1];
  92             memcpy(m_Cache[tg].Name, dummy, (i+1)*sizeof(wxChar));
  93
  94             while (pos < lng && src[pos] != wxT('>')) pos++;
  95
  96             if (src[stpos+1] == wxT('/')) // ending tag:
  97             {
  98                 m_Cache[tg].End1 = m_Cache[tg].End2 = -2;
  99                 // find matching begin tag:
 100                 for (i = tg; i >= 0; i--)
 101                     if ((m_Cache[i].End1 == -1) && (wxStrcmp(m_Cache[i].Name, dummy+1) == 0))
 102                     {
 103                         m_Cache[i].End1 = stpos;
 104                         m_Cache[i].End2 = pos + 1;
 105                         break;
 106                     }
 107             }
 108             else
 109             {
 110                 m_Cache[tg].End1 = m_Cache[tg].End2 = -1;
 111             }
 112         }
 113
 114         pos++;
 115     }
 116
 117     // ok, we're done, now we'll free .Name members of cache - we don't need it anymore:
 118     for (i = 0; i < m_CacheSize; i++)
 119     {
 120         delete[] m_Cache[i].Name;
 121         m_Cache[i].Name = NULL;
 122     }
 123 }
 124
 125 void wxHtmlTagsCache::QueryTag(int at, int* end1, int* end2)
 126 {
 127     if (m_Cache == NULL) return;
 128     if (m_Cache[m_CachePos].Key != at)
 129     {
 130         int delta = (at < m_Cache[m_CachePos].Key) ? -1 : 1;
 131         do
 132         {
 133             m_CachePos += delta;
 134         }
 135         while (m_Cache[m_CachePos].Key != at);
 136     }
 137     *end1 = m_Cache[m_CachePos].End1;
 138     *end2 = m_Cache[m_CachePos].End2;
 139 }
 140
 141
 142
 143
 144 //-----------------------------------------------------------------------------
 145 // wxHtmlTag
 146 //-----------------------------------------------------------------------------
 147
 148 IMPLEMENT_CLASS(wxHtmlTag,wxObject)
 149
 150 wxHtmlTag::wxHtmlTag(const wxString& source, int pos, int end_pos,
 151                      wxHtmlTagsCache *cache,
 152                      wxHtmlEntitiesParser *entParser) : wxObject()
 153 {
 154     int i;
 155     wxChar c;
 156
 157     // fill-in name, params and begin pos:
 158     i = pos+1;
 159     if (source[i] == wxT('/'))
 160         { m_Ending = TRUE; i++; }
 161     else
 162         m_Ending = FALSE;
 163
 164     // find tag's name and convert it to uppercase:
 165     while ((i < end_pos) &&
 166            ((c = source[i++]) != wxT(' ') && c != wxT('\r') &&
 167              c != wxT('\n') && c != wxT('\t') &&
 168              c != wxT('>')))
 169     {
 170         if ((c >= wxT('a')) && (c <= wxT('z')))
 171             c -= (wxT('a') - wxT('A'));
 172         m_Name << c;
 173     }
 174
 175     // if the tag has parameters, read them and "normalize" them,
 176     // i.e. convert to uppercase, replace whitespaces by spaces and
 177     // remove whitespaces around '=':
 178     if (source[i-1] != wxT('>'))
 179     {
 180         #define IS_WHITE(c) (c == wxT(' ') || c == wxT('\r') || \
 181                              c == wxT('\n') || c == wxT('\t'))
 182         wxString pname, pvalue;
 183         wxChar quote;
 184         enum
 185         {
 186             ST_BEFORE_NAME = 1,
 187             ST_NAME,
 188             ST_BEFORE_EQ,
 189             ST_BEFORE_VALUE,
 190             ST_VALUE
 191         } state;
 192
 193         quote = 0;
 194         state = ST_BEFORE_NAME;
 195         while (i < end_pos)
 196         {
 197             c = source[i++];
 198
 199             if (c == wxT('>') && !(state == ST_VALUE && quote != 0))
 200             {
 201                 if (state == ST_BEFORE_EQ || state == ST_NAME)
 202                 {
 203                     m_ParamNames.Add(pname);
 204                     m_ParamValues.Add(wxEmptyString);
 205                 }
 206                 else if (state == ST_VALUE && quote == 0)
 207                 {
 208                     m_ParamNames.Add(pname);
 209                     m_ParamValues.Add(entParser->Parse(pvalue));
 210                 }
 211                 break;
 212             }
 213             switch (state)
 214             {
 215                 case ST_BEFORE_NAME:
 216                     if (!IS_WHITE(c))
 217                     {
 218                         pname = c;
 219                         state = ST_NAME;
 220                     }
 221                     break;
 222                 case ST_NAME:
 223                     if (IS_WHITE(c))
 224                         state = ST_BEFORE_EQ;
 225                     else if (c == wxT('='))
 226                         state = ST_BEFORE_VALUE;
 227                     else
 228                         pname << c;
 229                     break;
 230                 case ST_BEFORE_EQ:
 231                     if (c == wxT('='))
 232                         state = ST_BEFORE_VALUE;
 233                     else if (!IS_WHITE(c))
 234                     {
 235                         m_ParamNames.Add(pname);
 236                         m_ParamValues.Add(wxEmptyString);
 237                         pname = c;
 238                         state = ST_NAME;
 239                     }
 240                     break;
 241                 case ST_BEFORE_VALUE:
 242                     if (!IS_WHITE(c))
 243                     {
 244                         if (c == wxT('"') || c == wxT('\''))
 245                             quote = c, pvalue = wxEmptyString;
 246                         else
 247                             quote = 0, pvalue = c;
 248                         state = ST_VALUE;
 249                     }
 250                     break;
 251                 case ST_VALUE:
 252                     if ((quote != 0 && c == quote) ||
 253                         (quote == 0 && IS_WHITE(c)))
 254                     {
 255                         m_ParamNames.Add(pname);
 256                         if (quote == 0)
 257                         {
 258                             // VS: backward compatibility, no real reason,
 259                             //     but wxHTML code relies on this... :(
 260                             pvalue.MakeUpper();
 261                         }
 262                         m_ParamValues.Add(entParser->Parse(pvalue));
 263                         state = ST_BEFORE_NAME;
 264                     }
 265                     else
 266                         pvalue << c;
 267                     break;
 268             }
 269         }
 270
 271         #undef IS_WHITE
 272    }
 273    m_Begin = i;
 274
 275    cache->QueryTag(pos, &m_End1, &m_End2);
 276    if (m_End1 > end_pos) m_End1 = end_pos;
 277    if (m_End2 > end_pos) m_End2 = end_pos;
 278 }
 279
 280 bool wxHtmlTag::HasParam(const wxString& par) const
 281 {
 282     return (m_ParamNames.Index(par, FALSE) != wxNOT_FOUND);
 283 }
 284
 285 wxString wxHtmlTag::GetParam(const wxString& par, bool with_commas) const
 286 {
 287     int index = m_ParamNames.Index(par, FALSE);
 288     if (index == wxNOT_FOUND)
 289         return wxEmptyString;
 290     if (with_commas)
 291     {
 292         // VS: backward compatibility, seems to be never used by wxHTML...
 293         wxString s;
 294         s << wxT('"') << m_ParamValues[index] << wxT('"');
 295         return s;
 296     }
 297     else
 298         return m_ParamValues[index];
 299 }
 300
 301 int wxHtmlTag::ScanParam(const wxString& par, wxChar *format, void *param) const
 302 {
 303     wxString parval = GetParam(par);
 304     return wxSscanf(parval, format, param);
 305 }
 306
 307 wxString wxHtmlTag::GetAllParams() const
 308 {
 309     // VS: this function is for backward compatiblity only,
 310     //     never used by wxHTML
 311     wxString s;
 312     size_t cnt = m_ParamNames.GetCount();
 313     for (size_t i = 0; i < cnt; i++)
 314     {
 315         s << m_ParamNames[i];
 316         s << wxT('=');
 317         if (m_ParamValues[i].Find(wxT('"')) != wxNOT_FOUND)
 318             s << wxT('\'') << m_ParamValues[i] << wxT('\'');
 319         else
 320             s << wxT('"') << m_ParamValues[i] << wxT('"');
 321     }
 322     return s;
 323 }
 324
 325 #endif