1 /////////////////////////////////////////////////////////////////////////////
2 // Name: richtextxml.cpp
3 // Purpose: XML and HTML I/O for wxRichTextCtrl
4 // Author: Julian Smart
8 // Copyright: (c) Julian Smart
9 // Licence: wxWindows licence
10 /////////////////////////////////////////////////////////////////////////////
12 // For compilers that support precompilation, includes "wx.h".
13 #include "wx/wxprec.h"
27 #include "wx/filename.h"
28 #include "wx/clipbrd.h"
29 #include "wx/wfstream.h"
30 #include "wx/sstream.h"
31 #include "wx/module.h"
32 #include "wx/txtstrm.h"
33 #include "wx/xml/xml.h"
35 #include "wx/richtext/richtextxml.h"
37 IMPLEMENT_DYNAMIC_CLASS(wxRichTextXMLHandler
, wxRichTextFileHandler
)
40 bool wxRichTextXMLHandler::LoadFile(wxRichTextBuffer
*buffer
, wxInputStream
& stream
)
47 wxXmlDocument
* xmlDoc
= new wxXmlDocument
;
50 if (!xmlDoc
->Load(stream
, wxT("ISO-8859-1")))
56 if (xmlDoc
->GetRoot() && xmlDoc
->GetRoot()->GetType() == wxXML_ELEMENT_NODE
&& xmlDoc
->GetRoot()->GetName() == wxT("richtext"))
58 wxXmlNode
* child
= xmlDoc
->GetRoot()->GetChildren();
61 if (child
->GetType() == wxXML_ELEMENT_NODE
)
63 wxString name
= child
->GetName();
64 if (name
== wxT("richtext-version"))
68 ImportXML(buffer
, child
);
71 child
= child
->GetNext();
82 buffer
->UpdateRanges();
87 /// Recursively import an object
88 bool wxRichTextXMLHandler::ImportXML(wxRichTextBuffer
* buffer
, wxXmlNode
* node
)
90 wxString name
= node
->GetName();
92 bool doneChildren
= false;
94 if (name
== wxT("paragraphlayout"))
97 else if (name
== wxT("paragraph"))
99 wxRichTextParagraph
* para
= new wxRichTextParagraph(buffer
);
100 buffer
->AppendChild(para
);
102 GetStyle(para
->GetAttributes(), node
, true);
104 wxXmlNode
* child
= node
->GetChildren();
107 wxString childName
= child
->GetName();
108 if (childName
== wxT("text"))
111 wxXmlNode
* textChild
= child
->GetChildren();
114 if (textChild
->GetType() == wxXML_TEXT_NODE
||
115 textChild
->GetType() == wxXML_CDATA_SECTION_NODE
)
117 wxString text2
= textChild
->GetContent();
119 // Strip whitespace from end
120 if (text2
.Length() > 0 && text2
[text2
.Length()-1] == wxT('\n'))
121 text2
= text2
.Mid(0, text2
.Length()-1);
123 if (text2
.Length() > 0 && text2
[0] == wxT('"'))
124 text2
= text2
.Mid(1);
125 if (text2
.Length() > 0 && text2
[text2
.Length()-1] == wxT('"'))
126 text2
= text2
.Mid(0, text2
.Length() - 1);
128 // TODO: further entity translation
129 text2
.Replace(wxT("<"), wxT("<"));
130 text2
.Replace(wxT(">"), wxT(">"));
131 text2
.Replace(wxT("&"), wxT("&"));
132 text2
.Replace(wxT("""), wxT("\""));
136 textChild
= textChild
->GetNext();
139 wxRichTextPlainText
* textObject
= new wxRichTextPlainText(text
, para
);
140 GetStyle(textObject
->GetAttributes(), child
, false);
142 para
->AppendChild(textObject
);
144 else if (childName
== wxT("image"))
146 int imageType
= wxBITMAP_TYPE_PNG
;
147 wxString value
= node
->GetPropVal(wxT("imagetype"), wxEmptyString
);
148 if (!value
.IsEmpty())
149 imageType
= wxAtoi(value
);
153 wxXmlNode
* imageChild
= child
->GetChildren();
156 wxString childName
= imageChild
->GetName();
157 if (childName
== wxT("data"))
159 wxXmlNode
* dataChild
= imageChild
->GetChildren();
162 data
= dataChild
->GetContent();
164 dataChild
= dataChild
->GetNext();
168 imageChild
= imageChild
->GetNext();
173 wxRichTextImage
* imageObj
= new wxRichTextImage(para
);
174 para
->AppendChild(imageObj
);
176 wxStringInputStream
strStream(data
);
178 imageObj
->GetImageBlock().ReadHex(strStream
, data
.Length(), imageType
);
181 child
= child
->GetNext();
189 wxXmlNode
* child
= node
->GetChildren();
192 ImportXML(buffer
, child
);
193 child
= child
->GetNext();
201 //-----------------------------------------------------------------------------
202 // xml support routines
203 //-----------------------------------------------------------------------------
205 bool wxRichTextXMLHandler::HasParam(wxXmlNode
* node
, const wxString
& param
)
207 return (GetParamNode(node
, param
) != NULL
);
210 wxXmlNode
*wxRichTextXMLHandler::GetParamNode(wxXmlNode
* node
, const wxString
& param
)
212 wxCHECK_MSG(node
, NULL
, wxT("You can't access node data before it was initialized!"));
214 wxXmlNode
*n
= node
->GetChildren();
218 if (n
->GetType() == wxXML_ELEMENT_NODE
&& n
->GetName() == param
)
226 wxString
wxRichTextXMLHandler::GetNodeContent(wxXmlNode
*node
)
229 if (n
== NULL
) return wxEmptyString
;
230 n
= n
->GetChildren();
234 if (n
->GetType() == wxXML_TEXT_NODE
||
235 n
->GetType() == wxXML_CDATA_SECTION_NODE
)
236 return n
->GetContent();
239 return wxEmptyString
;
243 wxString
wxRichTextXMLHandler::GetParamValue(wxXmlNode
*node
, const wxString
& param
)
246 return GetNodeContent(node
);
248 return GetNodeContent(GetParamNode(node
, param
));
251 wxString
wxRichTextXMLHandler::GetText(wxXmlNode
*node
, const wxString
& param
, bool WXUNUSED(translate
))
253 wxXmlNode
*parNode
= GetParamNode(node
, param
);
256 wxString
str1(GetNodeContent(parNode
));
260 // write string to output:
261 inline static void OutputString(wxOutputStream
& stream
, const wxString
& str
,
262 wxMBConv
*convMem
= NULL
, wxMBConv
*convFile
= NULL
)
264 if (str
.IsEmpty()) return;
266 const wxWX2MBbuf
buf(str
.mb_str(convFile
? *convFile
: wxConvUTF8
));
267 stream
.Write((const char*)buf
, strlen((const char*)buf
));
269 if ( convFile
== NULL
)
270 stream
.Write(str
.mb_str(), str
.Len());
273 wxString
str2(str
.wc_str(*convMem
), *convFile
);
274 stream
.Write(str2
.mb_str(), str2
.Len());
279 // Same as above, but create entities first.
280 // Translates '<' to "<", '>' to ">" and '&' to "&"
281 static void OutputStringEnt(wxOutputStream
& stream
, const wxString
& str
,
282 wxMBConv
*convMem
= NULL
, wxMBConv
*convFile
= NULL
)
290 for (i
= 0; i
< len
; i
++)
293 if (c
== wxT('<') || c
== wxT('>') || c
== wxT('"') ||
294 (c
== wxT('&') && (str
.Mid(i
+1, 4) != wxT("amp;"))))
296 OutputString(stream
, str
.Mid(last
, i
- last
), convMem
, convFile
);
300 OutputString(stream
, wxT("<"), NULL
, NULL
);
303 OutputString(stream
, wxT(">"), NULL
, NULL
);
306 OutputString(stream
, wxT("&"), NULL
, NULL
);
309 OutputString(stream
, wxT("""), NULL
, NULL
);
316 OutputString(stream
, str
.Mid(last
, i
- last
), convMem
, convFile
);
319 inline static void OutputIndentation(wxOutputStream
& stream
, int indent
)
321 wxString str
= wxT("\n");
322 for (int i
= 0; i
< indent
; i
++)
323 str
<< wxT(' ') << wxT(' ');
324 OutputString(stream
, str
, NULL
, NULL
);
327 static wxOutputStream
& operator <<(wxOutputStream
& stream
, const wxString
& s
)
329 stream
.Write(s
, s
.Length());
333 static wxOutputStream
& operator <<(wxOutputStream
& stream
, long l
)
336 str
.Printf(wxT("%ld"), l
);
337 return stream
<< str
;
340 static wxOutputStream
& operator <<(wxOutputStream
& stream
, const char c
)
343 str
.Printf(wxT("%c"), c
);
344 return stream
<< str
;
347 // Convert a colour to a 6-digit hex string
348 static wxString
ColourToHexString(const wxColour
& col
)
352 hex
+= wxDecToHex(col
.Red());
353 hex
+= wxDecToHex(col
.Green());
354 hex
+= wxDecToHex(col
.Blue());
359 // Convert 6-digit hex string to a colour
360 wxColour
HexStringToColour(const wxString
& hex
)
365 r
= wxHexToDec(hex
.Mid(0, 2));
366 g
= wxHexToDec(hex
.Mid(2, 2));
367 b
= wxHexToDec(hex
.Mid(4, 2));
369 return wxColour(r
, g
, b
);
372 bool wxRichTextXMLHandler::SaveFile(wxRichTextBuffer
*buffer
, wxOutputStream
& stream
)
377 wxString
version(wxT("1.0") ) ;
379 wxString
fileencoding(wxT("UTF-8")) ;
380 wxString
memencoding(wxT("UTF-8")) ;
382 wxString
fileencoding(wxT("ISO-8859-1")) ;
383 wxString
memencoding(wxT("ISO-8859-1")) ;
387 wxMBConv
*convMem
= NULL
, *convFile
= NULL
;
389 convFile
= new wxCSConv(fileencoding
);
391 if ( fileencoding
!= memencoding
)
393 convFile
= new wxCSConv(fileencoding
);
394 convMem
= new wxCSConv(memencoding
);
398 s
.Printf(wxT("<?xml version=\"%s\" encoding=\"%s\"?>\n"),
399 (const wxChar
*) version
, (const wxChar
*) fileencoding
);
400 OutputString(stream
, s
, NULL
, NULL
);
401 OutputString(stream
, wxT("<richtext version=\"1.0.0.0\" xmlns=\"http://www.wxwidgets.org\">") , NULL
, NULL
);
404 ExportXML(stream
, convMem
, convFile
, *buffer
, level
);
406 OutputString(stream
, wxT("\n</richtext>") , NULL
, NULL
);
407 OutputString(stream
, wxT("\n"), NULL
, NULL
);
415 /// Recursively export an object
416 bool wxRichTextXMLHandler::ExportXML(wxOutputStream
& stream
, wxMBConv
* convMem
, wxMBConv
* convFile
, wxRichTextObject
& obj
, int indent
)
419 if (obj
.IsKindOf(CLASSINFO(wxRichTextParagraphLayoutBox
)))
420 objectName
= wxT("paragraphlayout");
421 else if (obj
.IsKindOf(CLASSINFO(wxRichTextParagraph
)))
422 objectName
= wxT("paragraph");
423 else if (obj
.IsKindOf(CLASSINFO(wxRichTextPlainText
)))
424 objectName
= wxT("text");
425 else if (obj
.IsKindOf(CLASSINFO(wxRichTextImage
)))
426 objectName
= wxT("image");
428 objectName
= wxT("object");
430 if (obj
.IsKindOf(CLASSINFO(wxRichTextPlainText
)))
432 wxRichTextPlainText
& text
= (wxRichTextPlainText
&) obj
;
434 OutputIndentation(stream
, indent
);
435 stream
<< wxT("<") << objectName
;
437 wxString style
= CreateStyle(obj
.GetAttributes(), false);
439 stream
<< style
<< wxT(">");
441 wxString str
= text
.GetText();
442 if (str
.Length() > 0 && (str
[0] == wxT(' ') || str
[str
.Length()-1] == wxT(' ')))
445 OutputStringEnt(stream
, str
, convMem
, convFile
);
449 OutputStringEnt(stream
, str
, convMem
, convFile
);
451 else if (obj
.IsKindOf(CLASSINFO(wxRichTextImage
)))
453 wxRichTextImage
& imageObj
= (wxRichTextImage
&) obj
;
455 if (imageObj
.GetImage().Ok() && !imageObj
.GetImageBlock().Ok())
456 imageObj
.MakeBlock();
458 OutputIndentation(stream
, indent
);
459 stream
<< wxT("<") << objectName
;
460 if (!imageObj
.GetImageBlock().Ok())
467 stream
<< wxString::Format(wxT(" imagetype=\"%d\""), (int) imageObj
.GetImageBlock().GetImageType()) << wxT(">");
470 OutputIndentation(stream
, indent
+1);
471 stream
<< wxT("<data>");
473 imageObj
.GetImageBlock().WriteHex(stream
);
475 stream
<< wxT("</data>");
477 else if (obj
.IsKindOf(CLASSINFO(wxRichTextCompositeObject
)))
479 OutputIndentation(stream
, indent
);
480 stream
<< wxT("<") << objectName
;
483 if (objectName
== wxT("paragraph") || objectName
== wxT("paragraphlayout"))
486 wxString style
= CreateStyle(obj
.GetAttributes(), isPara
);
488 stream
<< style
<< wxT(">");
490 wxRichTextCompositeObject
& composite
= (wxRichTextCompositeObject
&) obj
;
492 for (i
= 0; i
< composite
.GetChildCount(); i
++)
494 wxRichTextObject
* child
= composite
.GetChild(i
);
495 ExportXML(stream
, convMem
, convFile
, *child
, indent
+1);
499 if (objectName
!= wxT("text"))
500 OutputIndentation(stream
, indent
);
502 stream
<< wxT("</") << objectName
<< wxT(">");
507 /// Create style parameters
508 wxString
wxRichTextXMLHandler::CreateStyle(const wxTextAttrEx
& attr
, bool isPara
)
511 if (attr
.GetTextColour().Ok())
513 str
<< wxT(" textcolor=\"#") << ColourToHexString(attr
.GetTextColour()) << wxT("\"");
515 if (attr
.GetBackgroundColour().Ok())
517 str
<< wxT(" bgcolor=\"#") << ColourToHexString(attr
.GetBackgroundColour()) << wxT("\"");
520 if (attr
.GetFont().Ok())
522 str
<< wxT(" fontsize=\"") << attr
.GetFont().GetPointSize() << wxT("\"");
523 str
<< wxT(" fontfamily=\"") << attr
.GetFont().GetFamily() << wxT("\"");
524 str
<< wxT(" fontstyle=\"") << attr
.GetFont().GetStyle() << wxT("\"");
525 str
<< wxT(" fontweight=\"") << attr
.GetFont().GetWeight() << wxT("\"");
526 str
<< wxT(" fontunderlined=\"") << (int) attr
.GetFont().GetUnderlined() << wxT("\"");
527 str
<< wxT(" fontface=\"") << attr
.GetFont().GetFaceName() << wxT("\"");
530 if (!attr
.GetCharacterStyleName().IsEmpty())
531 str
<< wxT(" charactertyle=\"") << wxString(attr
.GetCharacterStyleName()) << wxT("\"");
535 str
<< wxT(" alignment=\"") << (int) attr
.GetAlignment() << wxT("\"");
536 str
<< wxT(" leftindent=\"") << (int) attr
.GetLeftIndent() << wxT("\"");
537 str
<< wxT(" leftsubindent=\"") << (int) attr
.GetLeftSubIndent() << wxT("\"");
538 str
<< wxT(" rightindent=\"") << (int) attr
.GetRightIndent() << wxT("\"");
539 str
<< wxT(" parspacingafter=\"") << (int) attr
.GetParagraphSpacingAfter() << wxT("\"");
540 str
<< wxT(" parspacingbefore=\"") << (int) attr
.GetParagraphSpacingBefore() << wxT("\"");
541 str
<< wxT(" linespacing=\"") << (int) attr
.GetLineSpacing() << wxT("\"");
542 str
<< wxT(" bulletstyle=\"") << (int) attr
.GetBulletStyle() << wxT("\"");
543 str
<< wxT(" bulletnumber=\"") << (int) attr
.GetBulletNumber() << wxT("\"");
544 str
<< wxT(" bulletsymbol=\"") << wxString(attr
.GetBulletSymbol()) << wxT("\"");
546 if (!attr
.GetParagraphStyleName().IsEmpty())
547 str
<< wxT(" parstyle=\"") << wxString(attr
.GetParagraphStyleName()) << wxT("\"");
553 /// Get style parameters
554 bool wxRichTextXMLHandler::GetStyle(wxTextAttrEx
& attr
, wxXmlNode
* node
, bool isPara
)
556 wxString fontFacename
;
558 int fontFamily
= wxDEFAULT
;
559 int fontWeight
= wxNORMAL
;
560 int fontStyle
= wxNORMAL
;
561 bool fontUnderlined
= false;
563 fontFacename
= node
->GetPropVal(wxT("fontface"), wxEmptyString
);
565 wxString value
= node
->GetPropVal(wxT("fontfamily"), wxEmptyString
);
566 if (!value
.IsEmpty())
567 fontFamily
= wxAtoi(value
);
569 value
= node
->GetPropVal(wxT("fontstyle"), wxEmptyString
);
570 if (!value
.IsEmpty())
571 fontStyle
= wxAtoi(value
);
573 value
= node
->GetPropVal(wxT("fontsize"), wxEmptyString
);
574 if (!value
.IsEmpty())
575 fontSize
= wxAtoi(value
);
577 value
= node
->GetPropVal(wxT("fontweight"), wxEmptyString
);
578 if (!value
.IsEmpty())
579 fontWeight
= wxAtoi(value
);
581 value
= node
->GetPropVal(wxT("fontunderlined"), wxEmptyString
);
582 if (!value
.IsEmpty())
583 fontUnderlined
= wxAtoi(value
) != 0;
585 attr
.SetFont(* wxTheFontList
->FindOrCreateFont(fontSize
, fontFamily
, fontStyle
, fontWeight
, fontUnderlined
, fontFacename
));
587 value
= node
->GetPropVal(wxT("textcolor"), wxEmptyString
);
588 if (!value
.IsEmpty())
590 if (value
[0] == wxT('#'))
591 attr
.SetTextColour(HexStringToColour(value
.Mid(1)));
593 attr
.SetTextColour(value
);
596 value
= node
->GetPropVal(wxT("backgroundcolor"), wxEmptyString
);
597 if (!value
.IsEmpty())
599 if (value
[0] == wxT('#'))
600 attr
.SetBackgroundColour(HexStringToColour(value
.Mid(1)));
602 attr
.SetBackgroundColour(value
);
605 value
= node
->GetPropVal(wxT("characterstyle"), wxEmptyString
);
606 if (!value
.IsEmpty())
607 attr
.SetCharacterStyleName(value
);
609 // Set paragraph attributes
612 value
= node
->GetPropVal(wxT("alignment"), wxEmptyString
);
613 if (!value
.IsEmpty())
614 attr
.SetAlignment((wxTextAttrAlignment
) wxAtoi(value
));
616 int leftSubIndent
= 0;
618 value
= node
->GetPropVal(wxT("leftindent"), wxEmptyString
);
619 if (!value
.IsEmpty())
620 leftIndent
= wxAtoi(value
);
621 value
= node
->GetPropVal(wxT("leftsubindent"), wxEmptyString
);
622 if (!value
.IsEmpty())
623 leftSubIndent
= wxAtoi(value
);
624 attr
.SetLeftIndent(leftIndent
, leftSubIndent
);
626 value
= node
->GetPropVal(wxT("rightindent"), wxEmptyString
);
627 if (!value
.IsEmpty())
628 attr
.SetRightIndent(wxAtoi(value
));
630 value
= node
->GetPropVal(wxT("parspacingbefore"), wxEmptyString
);
631 if (!value
.IsEmpty())
632 attr
.SetParagraphSpacingBefore(wxAtoi(value
));
634 value
= node
->GetPropVal(wxT("parspacingafter"), wxEmptyString
);
635 if (!value
.IsEmpty())
636 attr
.SetParagraphSpacingAfter(wxAtoi(value
));
638 value
= node
->GetPropVal(wxT("linespacing"), wxEmptyString
);
639 if (!value
.IsEmpty())
640 attr
.SetLineSpacing(wxAtoi(value
));
642 value
= node
->GetPropVal(wxT("bulletstyle"), wxEmptyString
);
643 if (!value
.IsEmpty())
644 attr
.SetBulletStyle(wxAtoi(value
));
646 value
= node
->GetPropVal(wxT("bulletnumber"), wxEmptyString
);
647 if (!value
.IsEmpty())
648 attr
.SetBulletNumber(wxAtoi(value
));
650 value
= node
->GetPropVal(wxT("bulletsymbol"), wxEmptyString
);
651 if (!value
.IsEmpty())
652 attr
.SetBulletSymbol(value
[0]);
654 value
= node
->GetPropVal(wxT("parstyle"), wxEmptyString
);
655 if (!value
.IsEmpty())
656 attr
.SetParagraphStyleName(value
);
664 IMPLEMENT_DYNAMIC_CLASS(wxRichTextHTMLHandler
, wxRichTextFileHandler
)
666 /// Can we handle this filename (if using files)? By default, checks the extension.
667 bool wxRichTextHTMLHandler::CanHandle(const wxString
& filename
) const
669 wxString path
, file
, ext
;
670 wxSplitPath(filename
, & path
, & file
, & ext
);
672 return (ext
.Lower() == wxT("html") || ext
.Lower() == wxT("htm"));
677 bool wxRichTextHTMLHandler::LoadFile(wxRichTextBuffer
*WXUNUSED(buffer
), wxInputStream
& WXUNUSED(stream
))
683 * We need to output only _changes_ in character formatting.
686 bool wxRichTextHTMLHandler::SaveFile(wxRichTextBuffer
*buffer
, wxOutputStream
& stream
)
688 buffer
->Defragment();
690 wxTextOutputStream
str(stream
);
692 wxTextAttrEx currentParaStyle
= buffer
->GetAttributes();
693 wxTextAttrEx currentCharStyle
= buffer
->GetAttributes();
695 str
<< wxT("<html><head></head><body>\n");
697 wxRichTextObjectList::compatibility_iterator node
= buffer
->GetChildren().GetFirst();
700 wxRichTextParagraph
* para
= wxDynamicCast(node
->GetData(), wxRichTextParagraph
);
701 wxASSERT (para
!= NULL
);
705 OutputParagraphFormatting(currentParaStyle
, para
->GetAttributes(), stream
, true);
707 wxRichTextObjectList::compatibility_iterator node2
= para
->GetChildren().GetFirst();
710 wxRichTextObject
* obj
= node2
->GetData();
711 wxRichTextPlainText
* textObj
= wxDynamicCast(obj
, wxRichTextPlainText
);
712 if (textObj
&& !textObj
->IsEmpty())
714 OutputCharacterFormatting(currentCharStyle
, obj
->GetAttributes(), stream
, true);
716 str
<< textObj
->GetText();
718 OutputCharacterFormatting(currentCharStyle
, obj
->GetAttributes(), stream
, false);
721 node2
= node2
->GetNext();
724 OutputParagraphFormatting(currentParaStyle
, para
->GetAttributes(), stream
, false);
729 node
= node
->GetNext();
732 str
<< wxT("</body></html>\n");
737 /// Output character formatting
738 void wxRichTextHTMLHandler::OutputCharacterFormatting(const wxTextAttrEx
& WXUNUSED(currentStyle
), const wxTextAttrEx
& thisStyle
, wxOutputStream
& stream
, bool start
)
740 wxTextOutputStream
str(stream
);
743 bool isItalic
= false;
744 bool isUnderline
= false;
747 if (thisStyle
.GetFont().Ok())
749 if (thisStyle
.GetFont().GetWeight() == wxBOLD
)
751 if (thisStyle
.GetFont().GetStyle() == wxITALIC
)
753 if (thisStyle
.GetFont().GetUnderlined())
756 faceName
= thisStyle
.GetFont().GetFaceName();
779 /// Output paragraph formatting
780 void wxRichTextHTMLHandler::OutputParagraphFormatting(const wxTextAttrEx
& WXUNUSED(currentStyle
), const wxTextAttrEx
& thisStyle
, wxOutputStream
& stream
, bool start
)
782 // TODO: lists, indentation (using tables), fonts, right-align, ...
784 wxTextOutputStream
str(stream
);
785 bool isCentered
= false;
787 if (thisStyle
.GetAlignment() == wxTEXT_ALIGNMENT_CENTRE
)
795 str
<< wxT("<center>");
800 str
<< wxT("</center>");