]> git.saurik.com Git - wxWidgets.git/blame - src/xml/xml.cpp
don't leak memory if exceptions are thrown during a new wxDocument creation
[wxWidgets.git] / src / xml / xml.cpp
CommitLineData
27b0c286 1/////////////////////////////////////////////////////////////////////////////
40989e46 2// Name: src/xml/xml.cpp
27b0c286
VS
3// Purpose: wxXmlDocument - XML parser & data holder class
4// Author: Vaclav Slavik
5// Created: 2000/03/05
6// RCS-ID: $Id$
7// Copyright: (c) 2000 Vaclav Slavik
65571936 8// Licence: wxWindows licence
27b0c286
VS
9/////////////////////////////////////////////////////////////////////////////
10
27b0c286
VS
11// For compilers that support precompilation, includes "wx.h".
12#include "wx/wxprec.h"
13
14#ifdef __BORLANDC__
15 #pragma hdrstop
16#endif
17
27b0c286
VS
18#if wxUSE_XML
19
40989e46
WS
20#include "wx/xml/xml.h"
21
88a7a4e1
WS
22#ifndef WX_PRECOMP
23 #include "wx/intl.h"
e4db172a 24 #include "wx/log.h"
670f9935 25 #include "wx/app.h"
88a7a4e1
WS
26#endif
27
27b0c286
VS
28#include "wx/wfstream.h"
29#include "wx/datstrm.h"
30#include "wx/zstream.h"
27b0c286 31#include "wx/strconv.h"
664e1314 32#include "wx/scopedptr.h"
27b0c286
VS
33
34#include "expat.h" // from Expat
35
34fdf762 36// DLL options compatibility check:
34fdf762
VS
37WX_CHECK_BUILD_OPTIONS("wxXML")
38
4c43dd90
JS
39
40IMPLEMENT_CLASS(wxXmlDocument, wxObject)
41
42
538f3830 43// a private utility used by wxXML
352d9b89 44static bool wxIsWhiteOnly(const wxString& buf);
538f3830 45
4c43dd90 46
27b0c286
VS
47//-----------------------------------------------------------------------------
48// wxXmlNode
49//-----------------------------------------------------------------------------
50
51wxXmlNode::wxXmlNode(wxXmlNode *parent,wxXmlNodeType type,
52 const wxString& name, const wxString& content,
6e26d6b7 53 wxXmlAttribute *attrs, wxXmlNode *next, int lineNo)
27b0c286 54 : m_type(type), m_name(name), m_content(content),
288b6107 55 m_attrs(attrs), m_parent(parent),
6e26d6b7
VS
56 m_children(NULL), m_next(next),
57 m_lineNo(lineNo)
27b0c286
VS
58{
59 if (m_parent)
60 {
61 if (m_parent->m_children)
62 {
63 m_next = m_parent->m_children;
64 m_parent->m_children = this;
65 }
66 else
67 m_parent->m_children = this;
68 }
69}
70
71wxXmlNode::wxXmlNode(wxXmlNodeType type, const wxString& name,
6e26d6b7
VS
72 const wxString& content,
73 int lineNo)
27b0c286 74 : m_type(type), m_name(name), m_content(content),
288b6107 75 m_attrs(NULL), m_parent(NULL),
6e26d6b7
VS
76 m_children(NULL), m_next(NULL),
77 m_lineNo(lineNo)
27b0c286
VS
78{}
79
80wxXmlNode::wxXmlNode(const wxXmlNode& node)
81{
82 m_next = NULL;
83 m_parent = NULL;
84 DoCopy(node);
85}
86
87wxXmlNode::~wxXmlNode()
88{
89 wxXmlNode *c, *c2;
90 for (c = m_children; c; c = c2)
91 {
92 c2 = c->m_next;
93 delete c;
94 }
95
288b6107
VS
96 wxXmlAttribute *p, *p2;
97 for (p = m_attrs; p; p = p2)
27b0c286
VS
98 {
99 p2 = p->GetNext();
100 delete p;
101 }
102}
103
104wxXmlNode& wxXmlNode::operator=(const wxXmlNode& node)
105{
288b6107 106 wxDELETE(m_attrs);
27b0c286
VS
107 wxDELETE(m_children);
108 DoCopy(node);
109 return *this;
110}
111
112void wxXmlNode::DoCopy(const wxXmlNode& node)
113{
114 m_type = node.m_type;
115 m_name = node.m_name;
116 m_content = node.m_content;
6e26d6b7 117 m_lineNo = node.m_lineNo;
27b0c286
VS
118 m_children = NULL;
119
120 wxXmlNode *n = node.m_children;
121 while (n)
122 {
123 AddChild(new wxXmlNode(*n));
124 n = n->GetNext();
125 }
126
288b6107
VS
127 m_attrs = NULL;
128 wxXmlAttribute *p = node.m_attrs;
27b0c286
VS
129 while (p)
130 {
288b6107 131 AddAttribute(p->GetName(), p->GetValue());
27b0c286
VS
132 p = p->GetNext();
133 }
134}
135
288b6107 136bool wxXmlNode::HasAttribute(const wxString& attrName) const
27b0c286 137{
288b6107 138 wxXmlAttribute *attr = GetAttributes();
27b0c286 139
288b6107 140 while (attr)
27b0c286 141 {
288b6107
VS
142 if (attr->GetName() == attrName) return true;
143 attr = attr->GetNext();
27b0c286
VS
144 }
145
759f7272 146 return false;
27b0c286
VS
147}
148
288b6107 149bool wxXmlNode::GetAttribute(const wxString& attrName, wxString *value) const
27b0c286 150{
cc24bf91
VS
151 wxCHECK_MSG( value, false, "value argument must not be NULL" );
152
288b6107 153 wxXmlAttribute *attr = GetAttributes();
27b0c286 154
288b6107 155 while (attr)
27b0c286 156 {
288b6107 157 if (attr->GetName() == attrName)
27b0c286 158 {
288b6107 159 *value = attr->GetValue();
759f7272 160 return true;
27b0c286 161 }
288b6107 162 attr = attr->GetNext();
27b0c286
VS
163 }
164
759f7272 165 return false;
27b0c286
VS
166}
167
288b6107 168wxString wxXmlNode::GetAttribute(const wxString& attrName, const wxString& defaultVal) const
27b0c286
VS
169{
170 wxString tmp;
288b6107 171 if (GetAttribute(attrName, &tmp))
27b0c286 172 return tmp;
0e2710a6
DS
173
174 return defaultVal;
27b0c286
VS
175}
176
177void wxXmlNode::AddChild(wxXmlNode *child)
178{
179 if (m_children == NULL)
180 m_children = child;
181 else
182 {
183 wxXmlNode *ch = m_children;
184 while (ch->m_next) ch = ch->m_next;
185 ch->m_next = child;
186 }
187 child->m_next = NULL;
188 child->m_parent = this;
189}
190
5e05df3c
VS
191// inserts a new node in front of 'followingNode'
192bool wxXmlNode::InsertChild(wxXmlNode *child, wxXmlNode *followingNode)
27b0c286 193{
5e05df3c
VS
194 wxCHECK_MSG( child, false, "cannot insert a NULL node!" );
195 wxCHECK_MSG( child->m_parent == NULL, false, "node already has a parent" );
196 wxCHECK_MSG( child->m_next == NULL, false, "node already has m_next" );
197 wxCHECK_MSG( followingNode == NULL || followingNode->GetParent() == this,
198 false,
199 "wxXmlNode::InsertChild - followingNode has incorrect parent" );
200
201 // this is for backward compatibility, NULL was allowed here thanks to
202 // the confusion about followingNode's meaning
203 if ( followingNode == NULL )
204 followingNode = m_children;
205
206 if ( m_children == followingNode )
fa6a8373 207 {
fa6a8373
RR
208 child->m_next = m_children;
209 m_children = child;
fa6a8373 210 }
27b0c286
VS
211 else
212 {
213 wxXmlNode *ch = m_children;
5e05df3c
VS
214 while ( ch && ch->m_next != followingNode )
215 ch = ch->m_next;
216 if ( !ch )
217 {
218 wxFAIL_MSG( "followingNode has this node as parent, but couldn't be found among children" );
219 return false;
220 }
221
222 child->m_next = followingNode;
27b0c286
VS
223 ch->m_next = child;
224 }
225
226 child->m_parent = this;
fa6a8373 227 return true;
27b0c286
VS
228}
229
43a302f2
VS
230// inserts a new node right after 'precedingNode'
231bool wxXmlNode::InsertChildAfter(wxXmlNode *child, wxXmlNode *precedingNode)
232{
233 wxCHECK_MSG( child, false, "cannot insert a NULL node!" );
234 wxCHECK_MSG( child->m_parent == NULL, false, "node already has a parent" );
235 wxCHECK_MSG( child->m_next == NULL, false, "node already has m_next" );
236 wxCHECK_MSG( precedingNode == NULL || precedingNode->m_parent == this, false,
237 "precedingNode has wrong parent" );
238
239 if ( precedingNode )
240 {
241 child->m_next = precedingNode->m_next;
242 precedingNode->m_next = child;
243 }
244 else // precedingNode == NULL
245 {
246 wxCHECK_MSG( m_children == NULL, false,
247 "NULL precedingNode only makes sense when there are no children" );
248
249 child->m_next = m_children;
250 m_children = child;
251 }
252
253 child->m_parent = this;
254 return true;
255}
256
27b0c286
VS
257bool wxXmlNode::RemoveChild(wxXmlNode *child)
258{
259 if (m_children == NULL)
759f7272 260 return false;
27b0c286
VS
261 else if (m_children == child)
262 {
263 m_children = child->m_next;
264 child->m_parent = NULL;
265 child->m_next = NULL;
759f7272 266 return true;
27b0c286
VS
267 }
268 else
269 {
270 wxXmlNode *ch = m_children;
271 while (ch->m_next)
272 {
273 if (ch->m_next == child)
274 {
275 ch->m_next = child->m_next;
276 child->m_parent = NULL;
277 child->m_next = NULL;
759f7272 278 return true;
27b0c286
VS
279 }
280 ch = ch->m_next;
281 }
759f7272 282 return false;
27b0c286
VS
283 }
284}
285
e13ce4a3
VZ
286void wxXmlNode::AddAttribute(const wxString& name, const wxString& value)
287{
288 AddProperty(name, value);
289}
290
291void wxXmlNode::AddAttribute(wxXmlAttribute *attr)
292{
293 AddProperty(attr);
294}
295
296bool wxXmlNode::DeleteAttribute(const wxString& name)
297{
298 return DeleteProperty(name);
299}
300
27b0c286
VS
301void wxXmlNode::AddProperty(const wxString& name, const wxString& value)
302{
288b6107 303 AddProperty(new wxXmlAttribute(name, value, NULL));
27b0c286
VS
304}
305
288b6107 306void wxXmlNode::AddProperty(wxXmlAttribute *attr)
27b0c286 307{
288b6107
VS
308 if (m_attrs == NULL)
309 m_attrs = attr;
27b0c286
VS
310 else
311 {
288b6107 312 wxXmlAttribute *p = m_attrs;
27b0c286 313 while (p->GetNext()) p = p->GetNext();
288b6107 314 p->SetNext(attr);
27b0c286
VS
315 }
316}
317
318bool wxXmlNode::DeleteProperty(const wxString& name)
319{
288b6107 320 wxXmlAttribute *attr;
27b0c286 321
288b6107 322 if (m_attrs == NULL)
759f7272 323 return false;
27b0c286 324
288b6107 325 else if (m_attrs->GetName() == name)
27b0c286 326 {
288b6107
VS
327 attr = m_attrs;
328 m_attrs = attr->GetNext();
329 attr->SetNext(NULL);
330 delete attr;
759f7272 331 return true;
27b0c286
VS
332 }
333
334 else
335 {
288b6107 336 wxXmlAttribute *p = m_attrs;
27b0c286
VS
337 while (p->GetNext())
338 {
339 if (p->GetNext()->GetName() == name)
340 {
288b6107
VS
341 attr = p->GetNext();
342 p->SetNext(attr->GetNext());
343 attr->SetNext(NULL);
344 delete attr;
759f7272 345 return true;
27b0c286
VS
346 }
347 p = p->GetNext();
348 }
759f7272 349 return false;
27b0c286
VS
350 }
351}
352
4c43dd90
JS
353wxString wxXmlNode::GetNodeContent() const
354{
355 wxXmlNode *n = GetChildren();
356
357 while (n)
358 {
359 if (n->GetType() == wxXML_TEXT_NODE ||
360 n->GetType() == wxXML_CDATA_SECTION_NODE)
361 return n->GetContent();
362 n = n->GetNext();
363 }
364 return wxEmptyString;
365}
366
538f3830
VS
367int wxXmlNode::GetDepth(wxXmlNode *grandparent) const
368{
369 const wxXmlNode *n = this;
370 int ret = -1;
371
372 do
373 {
374 ret++;
375 n = n->GetParent();
376 if (n == grandparent)
377 return ret;
378
379 } while (n);
380
381 return wxNOT_FOUND;
382}
383
384bool wxXmlNode::IsWhitespaceOnly() const
385{
386 return wxIsWhiteOnly(m_content);
387}
388
27b0c286
VS
389
390
391//-----------------------------------------------------------------------------
392// wxXmlDocument
393//-----------------------------------------------------------------------------
394
395wxXmlDocument::wxXmlDocument()
e767076e 396 : m_version(wxS("1.0")), m_fileEncoding(wxS("utf-8")), m_root(NULL)
27b0c286
VS
397{
398#if !wxUSE_UNICODE
e767076e 399 m_encoding = wxS("UTF-8");
27b0c286
VS
400#endif
401}
402
403wxXmlDocument::wxXmlDocument(const wxString& filename, const wxString& encoding)
d0468e8c 404 :wxObject(), m_root(NULL)
27b0c286
VS
405{
406 if ( !Load(filename, encoding) )
407 {
408 wxDELETE(m_root);
409 }
410}
411
412wxXmlDocument::wxXmlDocument(wxInputStream& stream, const wxString& encoding)
d0468e8c 413 :wxObject(), m_root(NULL)
27b0c286
VS
414{
415 if ( !Load(stream, encoding) )
416 {
417 wxDELETE(m_root);
418 }
419}
420
421wxXmlDocument::wxXmlDocument(const wxXmlDocument& doc)
d0468e8c 422 :wxObject()
27b0c286
VS
423{
424 DoCopy(doc);
425}
426
427wxXmlDocument& wxXmlDocument::operator=(const wxXmlDocument& doc)
428{
429 wxDELETE(m_root);
430 DoCopy(doc);
431 return *this;
432}
433
434void wxXmlDocument::DoCopy(const wxXmlDocument& doc)
435{
436 m_version = doc.m_version;
437#if !wxUSE_UNICODE
438 m_encoding = doc.m_encoding;
439#endif
440 m_fileEncoding = doc.m_fileEncoding;
e8da6b7c
RR
441
442 if (doc.m_root)
443 m_root = new wxXmlNode(*doc.m_root);
444 else
445 m_root = NULL;
27b0c286
VS
446}
447
538f3830 448bool wxXmlDocument::Load(const wxString& filename, const wxString& encoding, int flags)
27b0c286
VS
449{
450 wxFileInputStream stream(filename);
97757cee
VZ
451 if (!stream.Ok())
452 return false;
538f3830 453 return Load(stream, encoding, flags);
27b0c286
VS
454}
455
538f3830 456bool wxXmlDocument::Save(const wxString& filename, int indentstep) const
27b0c286
VS
457{
458 wxFileOutputStream stream(filename);
97757cee
VZ
459 if (!stream.Ok())
460 return false;
538f3830 461 return Save(stream, indentstep);
27b0c286
VS
462}
463
464
465
466//-----------------------------------------------------------------------------
467// wxXmlDocument loading routines
468//-----------------------------------------------------------------------------
469
ddae497f
VZ
470// converts Expat-produced string in UTF-8 into wxString using the specified
471// conv or keep in UTF-8 if conv is NULL
472static wxString CharToString(wxMBConv *conv,
b04edcaf 473 const char *s, size_t len = wxString::npos)
27b0c286 474{
b04edcaf 475#if !wxUSE_UNICODE
27b0c286
VS
476 if ( conv )
477 {
ddae497f
VZ
478 // there can be no embedded NULs in this string so we don't need the
479 // output length, it will be NUL-terminated
480 const wxWCharBuffer wbuf(
6df6e35a 481 wxConvUTF8.cMB2WC(s, len == wxString::npos ? wxNO_LEN : len, NULL));
ddae497f 482
da452b9e 483 return wxString(wbuf, *conv);
27b0c286 484 }
b04edcaf
VS
485 // else: the string is wanted in UTF-8
486#endif // !wxUSE_UNICODE
487
488 wxUnusedVar(conv);
cc209a51 489 return wxString::FromUTF8Unchecked(s, len);
27b0c286
VS
490}
491
538f3830 492// returns true if the given string contains only whitespaces
352d9b89 493bool wxIsWhiteOnly(const wxString& buf)
538f3830 494{
352d9b89
VS
495 for ( wxString::const_iterator i = buf.begin(); i != buf.end(); ++i )
496 {
497 wxChar c = *i;
e767076e 498 if ( c != wxS(' ') && c != wxS('\t') && c != wxS('\n') && c != wxS('\r'))
538f3830 499 return false;
352d9b89 500 }
538f3830
VS
501 return true;
502}
503
504
27b0c286
VS
505struct wxXmlParsingContext
506{
43a302f2
VS
507 wxXmlParsingContext()
508 : conv(NULL),
509 root(NULL),
510 node(NULL),
511 lastChild(NULL),
512 lastAsText(NULL),
513 removeWhiteOnlyNodes(false)
514 {}
515
6e26d6b7 516 XML_Parser parser;
27b0c286
VS
517 wxMBConv *conv;
518 wxXmlNode *root;
43a302f2
VS
519 wxXmlNode *node; // the node being parsed
520 wxXmlNode *lastChild; // the last child of "node"
521 wxXmlNode *lastAsText; // the last _text_ child of "node"
27b0c286
VS
522 wxString encoding;
523 wxString version;
538f3830 524 bool removeWhiteOnlyNodes;
27b0c286
VS
525};
526
43a302f2
VS
527// checks that ctx->lastChild is in consistent state
// Asserts that (ctx)->lastChild, if set, really is the last child of
// (ctx)->node.
//
// The two assertions are wrapped in do/while(0) so that the macro behaves as
// a single statement even inside an unbraced if/else, and the argument is
// parenthesized so that any pointer expression can be passed.
#define ASSERT_LAST_CHILD_OK(ctx)                                       \
    do                                                                  \
    {                                                                   \
        wxASSERT( (ctx)->lastChild == NULL ||                           \
                  (ctx)->lastChild->GetNext() == NULL );                \
        wxASSERT( (ctx)->lastChild == NULL ||                           \
                  (ctx)->lastChild->GetParent() == (ctx)->node );       \
    } while ( 0 )
533
865bb325 534extern "C" {
27b0c286
VS
535static void StartElementHnd(void *userData, const char *name, const char **atts)
536{
537 wxXmlParsingContext *ctx = (wxXmlParsingContext*)userData;
6e26d6b7
VS
538 wxXmlNode *node = new wxXmlNode(wxXML_ELEMENT_NODE,
539 CharToString(ctx->conv, name),
540 wxEmptyString,
541 XML_GetCurrentLineNumber(ctx->parser));
27b0c286 542 const char **a = atts;
6e26d6b7 543
43a302f2 544 // add node attributes
27b0c286
VS
545 while (*a)
546 {
288b6107 547 node->AddAttribute(CharToString(ctx->conv, a[0]), CharToString(ctx->conv, a[1]));
27b0c286
VS
548 a += 2;
549 }
43a302f2 550
27b0c286 551 if (ctx->root == NULL)
43a302f2 552 {
27b0c286 553 ctx->root = node;
43a302f2 554 }
27b0c286 555 else
43a302f2
VS
556 {
557 ASSERT_LAST_CHILD_OK(ctx);
558 ctx->node->InsertChildAfter(node, ctx->lastChild);
559 }
560
27b0c286 561 ctx->lastAsText = NULL;
43a302f2
VS
562 ctx->lastChild = NULL; // our new node "node" has no children yet
563
564 ctx->node = node;
27b0c286
VS
565}
566
567static void EndElementHnd(void *userData, const char* WXUNUSED(name))
568{
569 wxXmlParsingContext *ctx = (wxXmlParsingContext*)userData;
570
43a302f2
VS
571 // we're exiting the last children of ctx->node->GetParent() and going
572 // back one level up, so current value of ctx->node points to the last
573 // child of ctx->node->GetParent()
574 ctx->lastChild = ctx->node;
575
27b0c286
VS
576 ctx->node = ctx->node->GetParent();
577 ctx->lastAsText = NULL;
578}
579
580static void TextHnd(void *userData, const char *s, int len)
581{
582 wxXmlParsingContext *ctx = (wxXmlParsingContext*)userData;
538f3830 583 wxString str = CharToString(ctx->conv, s, len);
27b0c286
VS
584
585 if (ctx->lastAsText)
586 {
d6cb1287 587 ctx->lastAsText->SetContent(ctx->lastAsText->GetContent() + str);
27b0c286
VS
588 }
589 else
590 {
538f3830
VS
591 bool whiteOnly = false;
592 if (ctx->removeWhiteOnlyNodes)
593 whiteOnly = wxIsWhiteOnly(str);
594
27b0c286
VS
595 if (!whiteOnly)
596 {
43a302f2 597 wxXmlNode *textnode =
e767076e 598 new wxXmlNode(wxXML_TEXT_NODE, wxS("text"), str,
6e26d6b7 599 XML_GetCurrentLineNumber(ctx->parser));
43a302f2
VS
600
601 ASSERT_LAST_CHILD_OK(ctx);
602 ctx->node->InsertChildAfter(textnode, ctx->lastChild);
603 ctx->lastChild= ctx->lastAsText = textnode;
27b0c286
VS
604 }
605 }
27b0c286
VS
606}
607
a01cbf0a
RR
608static void StartCdataHnd(void *userData)
609{
610 wxXmlParsingContext *ctx = (wxXmlParsingContext*)userData;
611
43a302f2 612 wxXmlNode *textnode =
e767076e 613 new wxXmlNode(wxXML_CDATA_SECTION_NODE, wxS("cdata"), wxS(""),
6e26d6b7 614 XML_GetCurrentLineNumber(ctx->parser));
43a302f2
VS
615
616 ASSERT_LAST_CHILD_OK(ctx);
617 ctx->node->InsertChildAfter(textnode, ctx->lastChild);
618 ctx->lastChild= ctx->lastAsText = textnode;
a01cbf0a 619}
a01cbf0a 620
27b0c286
VS
621static void CommentHnd(void *userData, const char *data)
622{
623 wxXmlParsingContext *ctx = (wxXmlParsingContext*)userData;
624
625 if (ctx->node)
626 {
43a302f2 627 wxXmlNode *commentnode =
6e26d6b7 628 new wxXmlNode(wxXML_COMMENT_NODE,
e767076e 629 wxS("comment"), CharToString(ctx->conv, data),
43a302f2
VS
630 XML_GetCurrentLineNumber(ctx->parser));
631
632 ASSERT_LAST_CHILD_OK(ctx);
633 ctx->node->InsertChildAfter(commentnode, ctx->lastChild);
634 ctx->lastChild = commentnode;
27b0c286 635 }
43a302f2
VS
636 //else: ctx->node == NULL happens if there is a comment before
637 // the root element. We current don't have a way to represent
638 // these in wxXmlDocument (FIXME).
639
27b0c286
VS
640 ctx->lastAsText = NULL;
641}
642
643static void DefaultHnd(void *userData, const char *s, int len)
644{
645 // XML header:
646 if (len > 6 && memcmp(s, "<?xml ", 6) == 0)
647 {
648 wxXmlParsingContext *ctx = (wxXmlParsingContext*)userData;
649
650 wxString buf = CharToString(ctx->conv, s, (size_t)len);
651 int pos;
e767076e 652 pos = buf.Find(wxS("encoding="));
27b0c286
VS
653 if (pos != wxNOT_FOUND)
654 ctx->encoding = buf.Mid(pos + 10).BeforeFirst(buf[(size_t)pos+9]);
e767076e 655 pos = buf.Find(wxS("version="));
27b0c286
VS
656 if (pos != wxNOT_FOUND)
657 ctx->version = buf.Mid(pos + 9).BeforeFirst(buf[(size_t)pos+8]);
658 }
659}
660
661static int UnknownEncodingHnd(void * WXUNUSED(encodingHandlerData),
662 const XML_Char *name, XML_Encoding *info)
663{
664 // We must build conversion table for expat. The easiest way to do so
665 // is to let wxCSConv convert as string containing all characters to
666 // wide character representation:
86501081 667 wxCSConv conv(name);
27b0c286
VS
668 char mbBuf[2];
669 wchar_t wcBuf[10];
670 size_t i;
671
672 mbBuf[1] = 0;
673 info->map[0] = 0;
674 for (i = 0; i < 255; i++)
675 {
676 mbBuf[0] = (char)(i+1);
677 if (conv.MB2WC(wcBuf, mbBuf, 2) == (size_t)-1)
678 {
679 // invalid/undefined byte in the encoding:
680 info->map[i+1] = -1;
681 }
682 info->map[i+1] = (int)wcBuf[0];
683 }
42841dfc 684
27b0c286
VS
685 info->data = NULL;
686 info->convert = NULL;
687 info->release = NULL;
688
689 return 1;
690}
26296ac9
VS
691
692} // extern "C"
27b0c286 693
538f3830 694bool wxXmlDocument::Load(wxInputStream& stream, const wxString& encoding, int flags)
27b0c286
VS
695{
696#if wxUSE_UNICODE
697 (void)encoding;
698#else
699 m_encoding = encoding;
700#endif
701
702 const size_t BUFSIZE = 1024;
703 char buf[BUFSIZE];
704 wxXmlParsingContext ctx;
705 bool done;
706 XML_Parser parser = XML_ParserCreate(NULL);
707
e767076e 708 ctx.encoding = wxS("UTF-8"); // default in absence of encoding=""
27b0c286
VS
709 ctx.conv = NULL;
710#if !wxUSE_UNICODE
e767076e 711 if ( encoding.CmpNoCase(wxS("UTF-8")) != 0 )
27b0c286
VS
712 ctx.conv = new wxCSConv(encoding);
713#endif
538f3830 714 ctx.removeWhiteOnlyNodes = (flags & wxXMLDOC_KEEP_WHITESPACE_NODES) == 0;
6e26d6b7 715 ctx.parser = parser;
27b0c286
VS
716
717 XML_SetUserData(parser, (void*)&ctx);
718 XML_SetElementHandler(parser, StartElementHnd, EndElementHnd);
719 XML_SetCharacterDataHandler(parser, TextHnd);
d6cb1287 720 XML_SetStartCdataSectionHandler(parser, StartCdataHnd);
27b0c286
VS
721 XML_SetCommentHandler(parser, CommentHnd);
722 XML_SetDefaultHandler(parser, DefaultHnd);
723 XML_SetUnknownEncodingHandler(parser, UnknownEncodingHnd, NULL);
724
725 bool ok = true;
726 do
727 {
728 size_t len = stream.Read(buf, BUFSIZE).LastRead();
729 done = (len < BUFSIZE);
730 if (!XML_Parse(parser, buf, len, done))
731 {
6a8fb6bd
VS
732 wxString error(XML_ErrorString(XML_GetErrorCode(parser)),
733 *wxConvCurrent);
27b0c286 734 wxLogError(_("XML parsing error: '%s' at line %d"),
6a8fb6bd 735 error.c_str(),
27b0c286
VS
736 XML_GetCurrentLineNumber(parser));
737 ok = false;
738 break;
739 }
740 } while (!done);
741
742 if (ok)
743 {
759f7272 744 if (!ctx.version.empty())
6a8fb6bd 745 SetVersion(ctx.version);
759f7272 746 if (!ctx.encoding.empty())
6a8fb6bd 747 SetFileEncoding(ctx.encoding);
27b0c286
VS
748 SetRoot(ctx.root);
749 }
6a8fb6bd
VS
750 else
751 {
752 delete ctx.root;
753 }
27b0c286
VS
754
755 XML_ParserFree(parser);
756#if !wxUSE_UNICODE
757 if ( ctx.conv )
758 delete ctx.conv;
759#endif
760
761 return ok;
762
763}
764
765
766
767//-----------------------------------------------------------------------------
768// wxXmlDocument saving routines
769//-----------------------------------------------------------------------------
770
e767076e
VZ
771// helpers for XML generation
772namespace
773{
774
27b0c286 775// write string to output:
e767076e
VZ
776bool OutputString(wxOutputStream& stream,
777 const wxString& str,
778 wxMBConv *convMem,
779 wxMBConv *convFile)
27b0c286 780{
8dfd4fad 781 if (str.empty())
e767076e 782 return true;
8dfd4fad 783
27b0c286 784#if wxUSE_UNICODE
8dfd4fad
VZ
785 wxUnusedVar(convMem);
786
3232da9d 787 const wxWX2MBbuf buf(str.mb_str(*(convFile ? convFile : &wxConvUTF8)));
e767076e
VZ
788 if ( !buf )
789 return false;
790
791 stream.Write(buf, strlen(buf));
8dfd4fad
VZ
792#else // !wxUSE_UNICODE
793 if ( convFile && convMem )
27b0c286
VS
794 {
795 wxString str2(str.wc_str(*convMem), *convFile);
e767076e 796 stream.Write(str2.mb_str(), str2.length());
27b0c286 797 }
8dfd4fad
VZ
798 else // no conversions to do
799 {
e767076e 800 stream.Write(str.mb_str(), str.length());
8dfd4fad
VZ
801 }
802#endif // wxUSE_UNICODE/!wxUSE_UNICODE
e767076e
VZ
803
804 return stream.IsOk();
27b0c286
VS
805}
806
8dfd4fad
VZ
807// flags for OutputStringEnt()
enum
{
    // also replace double quotes with "&quot;", as needed in attribute values
    XML_ESCAPE_QUOTES = 1
};
812
27b0c286
VS
813// Same as above, but create entities first.
814// Translates '<' to "&lt;", '>' to "&gt;" and '&' to "&amp;"
e767076e
VZ
815bool OutputStringEnt(wxOutputStream& stream,
816 const wxString& str,
817 wxMBConv *convMem,
818 wxMBConv *convFile,
819 int flags = 0)
820{
821 const size_t len = str.length();
822 size_t i,
823 last = 0;
27b0c286
VS
824 for (i = 0; i < len; i++)
825 {
e767076e
VZ
826 wxChar c = str.GetChar(i);
827 if (c == wxS('<') || c == wxS('>') ||
9c39f4f5 828 (c == wxS('&') && str.substr(i+1, 4) != wxS("amp;")) ||
e767076e 829 ((flags & XML_ESCAPE_QUOTES) && c == wxS('"')))
27b0c286 830 {
9c39f4f5
VZ
831 if ( !OutputString(stream, str.substr(last, i - last),
832 convMem, convFile) )
e767076e
VZ
833 return false;
834
835 const char *escaped;
836 switch ( c )
27b0c286 837 {
e767076e
VZ
838 case wxS('<'):
839 escaped = "&lt;";
27b0c286 840 break;
e767076e
VZ
841 case wxS('>'):
842 escaped = "&gt;";
27b0c286 843 break;
e767076e
VZ
844 case wxS('&'):
845 escaped = "&amp;";
27b0c286 846 break;
e767076e
VZ
847 case wxS('"'):
848 escaped = "&quot;";
8dfd4fad
VZ
849 break;
850 default:
e767076e
VZ
851 wxFAIL_MSG( "logic error in the code" );
852 return false;
27b0c286 853 }
e767076e
VZ
854
855 if ( !OutputString(stream, escaped, convMem, convFile) )
856 return false;
857
27b0c286
VS
858 last = i + 1;
859 }
860 }
e767076e 861
9c39f4f5 862 return OutputString(stream, str.substr(last, i - last), convMem, convFile);
27b0c286
VS
863}
864
e767076e
VZ
865bool OutputIndentation(wxOutputStream& stream,
866 int indent,
867 wxMBConv *convMem,
868 wxMBConv *convFile)
27b0c286 869{
e767076e
VZ
870 wxString str(wxS("\n"));
871 str += wxString(2*indent, wxS(' '));
872 return OutputString(stream, str, convMem, convFile);
27b0c286
VS
873}
874
e767076e
VZ
875bool OutputNode(wxOutputStream& stream,
876 wxXmlNode *node,
877 int indent,
878 wxMBConv *convMem,
879 wxMBConv *convFile,
880 int indentstep)
27b0c286 881{
e767076e 882 bool rc;
27b0c286
VS
883 switch (node->GetType())
884 {
eac789ff 885 case wxXML_CDATA_SECTION_NODE:
e767076e
VZ
886 rc = OutputString(stream, wxS("<![CDATA["), convMem, convFile) &&
887 OutputString(stream, node->GetContent(), convMem, convFile) &&
888 OutputString(stream, wxS("]]>"), convMem, convFile);
eac789ff 889 break;
a01cbf0a 890
27b0c286 891 case wxXML_TEXT_NODE:
e767076e 892 rc = OutputStringEnt(stream, node->GetContent(), convMem, convFile);
27b0c286
VS
893 break;
894
895 case wxXML_ELEMENT_NODE:
e767076e
VZ
896 rc = OutputString(stream, wxS("<"), convMem, convFile) &&
897 OutputString(stream, node->GetName(), convMem, convFile);
27b0c286 898
e767076e 899 if ( rc )
27b0c286 900 {
e767076e
VZ
901 for ( wxXmlAttribute *attr = node->GetAttributes();
902 attr && rc;
903 attr = attr->GetNext() )
904 {
905 rc = OutputString(stream,
906 wxS(" ") + attr->GetName() + wxS("=\""),
907 convMem, convFile) &&
908 OutputStringEnt(stream, attr->GetValue(),
909 convMem, convFile,
910 XML_ESCAPE_QUOTES) &&
911 OutputString(stream, wxS("\""), convMem, convFile);
912 }
27b0c286
VS
913 }
914
e767076e 915 if ( node->GetChildren() )
27b0c286 916 {
e767076e
VZ
917 rc = OutputString(stream, wxS(">"), convMem, convFile);
918
919 wxXmlNode *prev = NULL;
920 for ( wxXmlNode *n = node->GetChildren();
921 n && rc;
922 n = n->GetNext() )
27b0c286 923 {
e767076e
VZ
924 if ( indentstep >= 0 && n->GetType() != wxXML_TEXT_NODE )
925 {
926 rc = OutputIndentation(stream, indent + indentstep,
927 convMem, convFile);
928 }
929
930 if ( rc )
931 rc = OutputNode(stream, n, indent + indentstep,
932 convMem, convFile, indentstep);
933
27b0c286 934 prev = n;
27b0c286 935 }
e767076e
VZ
936
937 if ( rc && indentstep >= 0 &&
938 prev && prev->GetType() != wxXML_TEXT_NODE )
939 {
940 rc = OutputIndentation(stream, indent, convMem, convFile);
941 }
942
943 if ( rc )
944 {
945 rc = OutputString(stream, wxS("</"), convMem, convFile) &&
946 OutputString(stream, node->GetName(),
947 convMem, convFile) &&
948 OutputString(stream, wxS(">"), convMem, convFile);
949 }
950 }
951 else // no children, output "<foo/>"
952 {
953 rc = OutputString(stream, wxS("/>"), convMem, convFile);
27b0c286 954 }
27b0c286
VS
955 break;
956
957 case wxXML_COMMENT_NODE:
e767076e
VZ
958 rc = OutputString(stream, wxS("<!--"), convMem, convFile) &&
959 OutputString(stream, node->GetContent(), convMem, convFile) &&
960 OutputString(stream, wxS("-->"), convMem, convFile);
27b0c286
VS
961 break;
962
963 default:
e767076e
VZ
964 wxFAIL_MSG("unsupported node type");
965 rc = false;
27b0c286 966 }
e767076e
VZ
967
968 return rc;
27b0c286
VS
969}
970
e767076e
VZ
971} // anonymous namespace
972
538f3830 973bool wxXmlDocument::Save(wxOutputStream& stream, int indentstep) const
27b0c286
VS
974{
975 if ( !IsOk() )
759f7272 976 return false;
27b0c286 977
e767076e 978 wxScopedPtr<wxMBConv> convMem, convFile;
759f7272 979
27b0c286 980#if wxUSE_UNICODE
e767076e 981 convFile.reset(new wxCSConv(GetFileEncoding()));
27b0c286 982#else
8605f9c5 983 if ( GetFileEncoding().CmpNoCase(GetEncoding()) != 0 )
27b0c286 984 {
e767076e
VZ
985 convFile.reset(new wxCSConv(GetFileEncoding()));
986 convMem.reset(new wxCSConv(GetEncoding()));
8605f9c5 987 }
e767076e 988 //else: file and in-memory encodings are the same, no conversion needed
27b0c286
VS
989#endif
990
e767076e
VZ
991 return OutputString(stream,
992 wxString::Format
993 (
994 wxS("<?xml version=\"%s\" encoding=\"%s\"?>\n"),
995 GetVersion(), GetFileEncoding()
996 ),
997 convMem.get(),
998 convFile.get()) &&
999 OutputNode(stream, GetRoot(), 0,
1000 convMem.get(), convFile.get(), indentstep) &&
1001 OutputString(stream, wxS("\n"), convMem.get(), convFile.get());
27b0c286
VS
1002}
1003
1004#endif // wxUSE_XML