1 ///////////////////////////////////////////////////////////////////////////// 
   2 // Name:        src/richtext/richtexthtml.cpp 
   3 // Purpose:     HTML I/O for wxRichTextCtrl 
   4 // Author:      Julian Smart 
   8 // Copyright:   (c) Julian Smart 
   9 // Licence:     wxWindows licence 
  10 ///////////////////////////////////////////////////////////////////////////// 
  12 // For compilers that support precompilation, includes "wx.h". 
  13 #include "wx/wxprec.h" 
  21 #include "wx/richtext/richtexthtml.h" 
  22 #include "wx/richtext/richtextstyles.h" 
  27 #include "wx/filename.h" 
  28 #include "wx/wfstream.h" 
  29 #include "wx/txtstrm.h" 
  32 #include "wx/filesys.h" 
  33 #include "wx/fs_mem.h" 
  36 IMPLEMENT_DYNAMIC_CLASS(wxRichTextHTMLHandler
, wxRichTextFileHandler
) 
  38 int wxRichTextHTMLHandler::sm_fileCounter 
= 1; 
  40 wxRichTextHTMLHandler::wxRichTextHTMLHandler(const wxString
& name
, const wxString
& ext
, int type
) 
  41     : wxRichTextFileHandler(name
, ext
, type
), m_buffer(NULL
), m_font(false), m_inTable(false) 
  43     m_fontSizeMapping
.Add(8); 
  44     m_fontSizeMapping
.Add(10); 
  45     m_fontSizeMapping
.Add(13); 
  46     m_fontSizeMapping
.Add(17); 
  47     m_fontSizeMapping
.Add(22); 
  48     m_fontSizeMapping
.Add(30); 
  49     m_fontSizeMapping
.Add(100); 
  52 /// Can we handle this filename (if using files)? By default, checks the extension. 
  53 bool wxRichTextHTMLHandler::CanHandle(const wxString
& filename
) const 
  55     wxString path
, file
, ext
; 
  56     wxFileName::SplitPath(filename
, & path
, & file
, & ext
); 
  58     return (ext
.Lower() == wxT("html") || ext
.Lower() == wxT("htm")); 
  63 bool wxRichTextHTMLHandler::DoLoadFile(wxRichTextBuffer 
*WXUNUSED(buffer
), wxInputStream
& WXUNUSED(stream
)) 
  69  * We need to output only _changes_ in character formatting. 
  72 bool wxRichTextHTMLHandler::DoSaveFile(wxRichTextBuffer 
*buffer
, wxOutputStream
& stream
) 
  76     ClearTemporaryImageLocations(); 
  81     wxCSConv
* customEncoding 
= NULL
; 
  82     wxMBConv
* conv 
= NULL
; 
  83     if (!GetEncoding().IsEmpty()) 
  85         customEncoding 
= new wxCSConv(GetEncoding()); 
  86         if (!customEncoding
->IsOk()) 
  88             wxDELETE(customEncoding
); 
  92         conv 
= customEncoding
; 
  99         wxTextOutputStream 
str(stream
, wxEOL_NATIVE
, *conv
); 
 101         wxTextOutputStream 
str(stream
, wxEOL_NATIVE
); 
 104         wxRichTextAttr currentParaStyle 
= buffer
->GetAttributes(); 
 105         wxRichTextAttr currentCharStyle 
= buffer
->GetAttributes(); 
 107         if ((GetFlags() & wxRICHTEXT_HANDLER_NO_HEADER_FOOTER
) == 0) 
 108             str 
<< wxT("<html><head></head><body>\n"); 
 110         OutputFont(currentParaStyle
, str
); 
 118         wxRichTextObjectList::compatibility_iterator node 
= buffer
->GetChildren().GetFirst(); 
 121             wxRichTextParagraph
* para 
= wxDynamicCast(node
->GetData(), wxRichTextParagraph
); 
 122             wxASSERT (para 
!= NULL
); 
 126                 wxRichTextAttr 
paraStyle(para
->GetCombinedAttributes()); 
 128                 BeginParagraphFormatting(currentParaStyle
, paraStyle
, str
); 
 130                 wxRichTextObjectList::compatibility_iterator node2 
= para
->GetChildren().GetFirst(); 
 133                     wxRichTextObject
* obj 
= node2
->GetData(); 
 134                     wxRichTextPlainText
* textObj 
= wxDynamicCast(obj
, wxRichTextPlainText
); 
 135                     if (textObj 
&& !textObj
->IsEmpty()) 
 137                         wxRichTextAttr 
charStyle(para
->GetCombinedAttributes(obj
->GetAttributes())); 
 138                         BeginCharacterFormatting(currentCharStyle
, charStyle
, paraStyle
, str
); 
 140                         wxString text 
= textObj
->GetText(); 
 142                         if (charStyle
.HasTextEffects() && (charStyle
.GetTextEffects() & wxTEXT_ATTR_EFFECT_CAPITALS
)) 
 145                         wxString toReplace 
= wxRichTextLineBreakChar
; 
 146                         text
.Replace(toReplace
, wxT("<br>")); 
 150                         EndCharacterFormatting(currentCharStyle
, charStyle
, paraStyle
, str
); 
 153                     wxRichTextImage
* image 
= wxDynamicCast(obj
, wxRichTextImage
); 
 154                     if( image 
&& (!image
->IsEmpty() || image
->GetImageBlock().GetData())) 
 155                         WriteImage( image
, stream 
); 
 157                     node2 
= node2
->GetNext(); 
 160                 EndParagraphFormatting(currentParaStyle
, paraStyle
, str
); 
 164             node 
= node
->GetNext(); 
 169         str 
<< wxT("</font>"); 
 171         if ((GetFlags() & wxRICHTEXT_HANDLER_NO_HEADER_FOOTER
) == 0) 
 172             str 
<< wxT("</body></html>"); 
 179         delete customEncoding
; 
 187 void wxRichTextHTMLHandler::BeginCharacterFormatting(const wxRichTextAttr
& currentStyle
, const wxRichTextAttr
& thisStyle
, const wxRichTextAttr
& WXUNUSED(paraStyle
), wxTextOutputStream
& str
) 
 191     // Is there any change in the font properties of the item? 
 192     if (thisStyle
.GetFontFaceName() != currentStyle
.GetFontFaceName()) 
 194         wxString 
faceName(thisStyle
.GetFontFaceName()); 
 195         style 
+= wxString::Format(wxT(" face=\"%s\""), faceName
.c_str()); 
 197     if (thisStyle
.GetFontSize() != currentStyle
.GetFontSize()) 
 198         style 
+= wxString::Format(wxT(" size=\"%ld\""), PtToSize(thisStyle
.GetFontSize())); 
 200     bool bTextColourChanged 
= (thisStyle
.GetTextColour() != currentStyle
.GetTextColour()); 
 201     bool bBackgroundColourChanged 
= (thisStyle
.GetBackgroundColour() != currentStyle
.GetBackgroundColour()); 
 202     if (bTextColourChanged 
|| bBackgroundColourChanged
) 
 204         style 
+= wxT(" style=\""); 
 206         if (bTextColourChanged
) 
 208             wxString 
color(thisStyle
.GetTextColour().GetAsString(wxC2S_HTML_SYNTAX
)); 
 209             style 
+= wxString::Format(wxT("color: %s"), color
.c_str()); 
 211         if (bTextColourChanged 
&& bBackgroundColourChanged
) 
 213         if (bBackgroundColourChanged
) 
 215             wxString 
color(thisStyle
.GetBackgroundColour().GetAsString(wxC2S_HTML_SYNTAX
)); 
 216             style 
+= wxString::Format(wxT("background-color: %s"), color
.c_str()); 
 224         str 
<< wxString::Format(wxT("<font %s >"), style
.c_str()); 
 228     if (thisStyle
.GetFontWeight() == wxBOLD
) 
 230     if (thisStyle
.GetFontStyle() == wxITALIC
) 
 232     if (thisStyle
.GetFontUnderlined()) 
 235     if (thisStyle
.HasURL()) 
 236         str 
<< wxT("<a href=\"") << thisStyle
.GetURL() << wxT("\">"); 
 238     if (thisStyle
.HasTextEffects()) 
 240         if (thisStyle
.GetTextEffects() & wxTEXT_ATTR_EFFECT_STRIKETHROUGH
) 
 242         if (thisStyle
.GetTextEffects() & wxTEXT_ATTR_EFFECT_SUPERSCRIPT
) 
 244         if (thisStyle
.GetTextEffects() & wxTEXT_ATTR_EFFECT_SUBSCRIPT
) 
 249 void wxRichTextHTMLHandler::EndCharacterFormatting(const wxRichTextAttr
& WXUNUSED(currentStyle
), const wxRichTextAttr
& thisStyle
, const wxRichTextAttr
& WXUNUSED(paraStyle
), wxTextOutputStream
& stream
) 
 251     if (thisStyle
.HasURL()) 
 252         stream 
<< wxT("</a>"); 
 254     if (thisStyle
.GetFontUnderlined()) 
 255         stream 
<< wxT("</u>"); 
 256     if (thisStyle
.GetFontStyle() == wxITALIC
) 
 257         stream 
<< wxT("</i>"); 
 258     if (thisStyle
.GetFontWeight() == wxBOLD
) 
 259         stream 
<< wxT("</b>"); 
 261     if (thisStyle
.HasTextEffects()) 
 263         if (thisStyle
.GetTextEffects() & wxTEXT_ATTR_EFFECT_STRIKETHROUGH
) 
 264             stream 
<< wxT("</del>"); 
 265         if (thisStyle
.GetTextEffects() & wxTEXT_ATTR_EFFECT_SUPERSCRIPT
) 
 266             stream 
<< wxT("</sup>"); 
 267         if (thisStyle
.GetTextEffects() & wxTEXT_ATTR_EFFECT_SUBSCRIPT
) 
 268             stream 
<< wxT("</sub>"); 
 274         stream 
<< wxT("</font>"); 
 278 /// Begin paragraph formatting 
 279 void wxRichTextHTMLHandler::BeginParagraphFormatting(const wxRichTextAttr
& WXUNUSED(currentStyle
), const wxRichTextAttr
& thisStyle
, wxTextOutputStream
& str
) 
 281     if (thisStyle
.HasPageBreak()) 
 283         str 
<< wxT("<div style=\"page-break-after:always\"></div>\n"); 
 286     if (thisStyle
.HasLeftIndent() && thisStyle
.GetLeftIndent() != 0) 
 288         if (thisStyle
.HasBulletStyle()) 
 290             int indent 
= thisStyle
.GetLeftIndent(); 
 292             // Close levels high than this 
 293             CloseLists(indent
, str
); 
 295             if (m_indents
.GetCount() > 0 && indent 
== m_indents
.Last()) 
 297                 // Same level, no need to start a new list 
 299             else if (m_indents
.GetCount() == 0 || indent 
> m_indents
.Last()) 
 301                 m_indents
.Add(indent
); 
 304                 int listType 
= TypeOfList(thisStyle
, tag
); 
 305                 m_listTypes
.Add(listType
); 
 307                 // wxHTML needs an extra <p> before a list when using <p> ... </p> in previous paragraphs. 
 308                 // TODO: pass a flag that indicates we're using wxHTML. 
 320             wxString align 
= GetAlignment(thisStyle
); 
 321             str 
<< wxString::Format(wxT("<p align=\"%s\""), align
.c_str()); 
 325             if ((GetFlags() & wxRICHTEXT_HANDLER_USE_CSS
) && thisStyle
.HasParagraphSpacingBefore()) 
 327                 float spacingBeforeMM 
= thisStyle
.GetParagraphSpacingBefore() / 10.0; 
 329                 styleStr 
+= wxString::Format(wxT("margin-top: %.2fmm; "), spacingBeforeMM
); 
 331             if ((GetFlags() & wxRICHTEXT_HANDLER_USE_CSS
) && thisStyle
.HasParagraphSpacingAfter()) 
 333                 float spacingAfterMM 
= thisStyle
.GetParagraphSpacingAfter() / 10.0; 
 335                 styleStr 
+= wxString::Format(wxT("margin-bottom: %.2fmm; "), spacingAfterMM
); 
 338             float indentLeftMM 
= (thisStyle
.GetLeftIndent() + thisStyle
.GetLeftSubIndent())/10.0; 
 339             if ((GetFlags() & wxRICHTEXT_HANDLER_USE_CSS
) && (indentLeftMM 
> 0.0)) 
 341                 styleStr 
+= wxString::Format(wxT("margin-left: %.2fmm; "), indentLeftMM
); 
 343             float indentRightMM 
= thisStyle
.GetRightIndent()/10.0; 
 344             if ((GetFlags() & wxRICHTEXT_HANDLER_USE_CSS
) && thisStyle
.HasRightIndent() && (indentRightMM 
> 0.0)) 
 346                 styleStr 
+= wxString::Format(wxT("margin-right: %.2fmm; "), indentRightMM
); 
 348             // First line indentation 
 349             float firstLineIndentMM 
= - thisStyle
.GetLeftSubIndent() / 10.0; 
 350             if ((GetFlags() & wxRICHTEXT_HANDLER_USE_CSS
) && (firstLineIndentMM 
> 0.0)) 
 352                 styleStr 
+= wxString::Format(wxT("text-indent: %.2fmm; "), firstLineIndentMM
); 
 355             if (!styleStr
.IsEmpty()) 
 356                 str 
<< wxT(" style=\"") << styleStr 
<< wxT("\""); 
 360             // TODO: convert to pixels 
 361             int indentPixels 
= static_cast<int>(indentLeftMM
*10/4); 
 363             if ((GetFlags() & wxRICHTEXT_HANDLER_USE_CSS
) == 0) 
 365                 // Use a table to do indenting if we don't have CSS 
 366                 str 
<< wxString::Format(wxT("<table border=0 cellpadding=0 cellspacing=0><tr><td width=\"%d\"></td><td>"), indentPixels
); 
 370             if (((GetFlags() & wxRICHTEXT_HANDLER_USE_CSS
) == 0) && (thisStyle
.GetLeftSubIndent() < 0)) 
 372                 str 
<< SymbolicIndent( - thisStyle
.GetLeftSubIndent()); 
 380         wxString align 
= GetAlignment(thisStyle
); 
 381         str 
<< wxString::Format(wxT("<p align=\"%s\""), align
.c_str()); 
 385         if ((GetFlags() & wxRICHTEXT_HANDLER_USE_CSS
) && thisStyle
.HasParagraphSpacingBefore()) 
 387             float spacingBeforeMM 
= thisStyle
.GetParagraphSpacingBefore() / 10.0; 
 389             styleStr 
+= wxString::Format(wxT("margin-top: %.2fmm; "), spacingBeforeMM
); 
 391         if ((GetFlags() & wxRICHTEXT_HANDLER_USE_CSS
) && thisStyle
.HasParagraphSpacingAfter()) 
 393             float spacingAfterMM 
= thisStyle
.GetParagraphSpacingAfter() / 10.0; 
 395             styleStr 
+= wxString::Format(wxT("margin-bottom: %.2fmm; "), spacingAfterMM
); 
 398         if (!styleStr
.IsEmpty()) 
 399             str 
<< wxT(" style=\"") << styleStr 
<< wxT("\""); 
 403     OutputFont(thisStyle
, str
); 
 406 /// End paragraph formatting 
 407 void wxRichTextHTMLHandler::EndParagraphFormatting(const wxRichTextAttr
& WXUNUSED(currentStyle
), const wxRichTextAttr
& thisStyle
, wxTextOutputStream
& stream
) 
 409     if (thisStyle
.HasFont()) 
 410         stream 
<< wxT("</font>"); 
 414         stream 
<< wxT("</td></tr></table></p>\n"); 
 417     else if (!thisStyle
.HasBulletStyle()) 
 418         stream 
<< wxT("</p>\n"); 
 421 /// Closes lists to level (-1 means close all) 
 422 void wxRichTextHTMLHandler::CloseLists(int level
, wxTextOutputStream
& str
) 
 424     // Close levels high than this 
 425     int i 
= m_indents
.GetCount()-1; 
 428         int l 
= m_indents
[i
]; 
 431             if (m_listTypes
[i
] == 0) 
 435             m_indents
.RemoveAt(i
); 
 436             m_listTypes
.RemoveAt(i
); 
 445 void wxRichTextHTMLHandler::OutputFont(const wxRichTextAttr
& style
, wxTextOutputStream
& stream
) 
 449         stream 
<< wxString::Format(wxT("<font face=\"%s\" size=\"%ld\""), style
.GetFontFaceName().c_str(), PtToSize(style
.GetFontSize())); 
 450         if (style
.HasTextColour()) 
 451             stream 
<< wxString::Format(wxT(" color=\"%s\""), style
.GetTextColour().GetAsString(wxC2S_HTML_SYNTAX
).c_str()); 
 456 int wxRichTextHTMLHandler::TypeOfList( const wxRichTextAttr
& thisStyle
, wxString
& tag 
) 
 458     // We can use number attribute of li tag but not all the browsers support it. 
 459     // also wxHtmlWindow doesn't support type attribute. 
 461     bool m_is_ul 
= false; 
 462     if (thisStyle
.GetBulletStyle() == (wxTEXT_ATTR_BULLET_STYLE_ARABIC
|wxTEXT_ATTR_BULLET_STYLE_PERIOD
)) 
 463         tag 
= wxT("<ol type=\"1\">"); 
 464     else if (thisStyle
.GetBulletStyle() == wxTEXT_ATTR_BULLET_STYLE_LETTERS_UPPER
) 
 465         tag 
= wxT("<ol type=\"A\">"); 
 466     else if (thisStyle
.GetBulletStyle() == wxTEXT_ATTR_BULLET_STYLE_LETTERS_LOWER
) 
 467         tag 
= wxT("<ol type=\"a\">"); 
 468     else if (thisStyle
.GetBulletStyle() == wxTEXT_ATTR_BULLET_STYLE_ROMAN_UPPER
) 
 469         tag 
= wxT("<ol type=\"I\">"); 
 470     else if (thisStyle
.GetBulletStyle() == wxTEXT_ATTR_BULLET_STYLE_ROMAN_LOWER
) 
 471         tag 
= wxT("<ol type=\"i\">"); 
 484 wxString 
wxRichTextHTMLHandler::GetAlignment( const wxRichTextAttr
& thisStyle 
) 
 486     switch( thisStyle
.GetAlignment() ) 
 488     case wxTEXT_ALIGNMENT_LEFT
: 
 490     case wxTEXT_ALIGNMENT_RIGHT
: 
 492     case wxTEXT_ALIGNMENT_CENTER
: 
 493         return wxT("center"); 
 494     case wxTEXT_ALIGNMENT_JUSTIFIED
: 
 495         return wxT("justify"); 
 501 void wxRichTextHTMLHandler::WriteImage(wxRichTextImage
* image
, wxOutputStream
& stream
) 
 503     wxTextOutputStream 
str(stream
); 
 505     str 
<< wxT("<img src=\""); 
 508     if (GetFlags() & wxRICHTEXT_HANDLER_SAVE_IMAGES_TO_MEMORY
) 
 511         if (!image
->GetImage().IsOk() && image
->GetImageBlock().GetData()) 
 512             image
->LoadFromBlock(); 
 513         if (image
->GetImage().IsOk() && !image
->GetImageBlock().GetData()) 
 517         if (image
->GetImageBlock().IsOk()) 
 520             image
->GetImageBlock().Load(img
); 
 523                 wxString 
ext(image
->GetImageBlock().GetExtension()); 
 524                 wxString 
tempFilename(wxString::Format(wxT("image%d.%s"), sm_fileCounter
, ext
)); 
 525                 wxMemoryFSHandler::AddFile(tempFilename
, img
, image
->GetImageBlock().GetImageType()); 
 527                 m_imageLocations
.Add(tempFilename
); 
 529                 str 
<< wxT("memory:") << tempFilename
; 
 533             str 
<< wxT("memory:?"); 
 537     else if (GetFlags() & wxRICHTEXT_HANDLER_SAVE_IMAGES_TO_FILES
) 
 540         if (!image
->GetImage().IsOk() && image
->GetImageBlock().GetData()) 
 541             image
->LoadFromBlock(); 
 542         if (image
->GetImage().IsOk() && !image
->GetImageBlock().GetData()) 
 546         if (image
->GetImageBlock().IsOk()) 
 548             wxString 
tempDir(GetTempDir()); 
 549             if (tempDir
.IsEmpty()) 
 550                 tempDir 
= wxFileName::GetTempDir(); 
 552             wxString 
ext(image
->GetImageBlock().GetExtension()); 
 553             wxString 
tempFilename(wxString::Format(wxT("%s/image%d.%s"), tempDir
, sm_fileCounter
, ext
)); 
 554             image
->GetImageBlock().Write(tempFilename
); 
 556             m_imageLocations
.Add(tempFilename
); 
 558             str 
<< wxFileSystem::FileNameToURL(tempFilename
); 
 561             str 
<< wxT("file:?"); 
 565     else // if (GetFlags() & wxRICHTEXT_HANDLER_SAVE_IMAGES_TO_BASE64) // this is implied 
 569         str 
<< GetMimeType(image
->GetImageBlock().GetImageType()); 
 570         str 
<< wxT(";base64,"); 
 572         if (image
->GetImage().IsOk() && !image
->GetImageBlock().GetData()) 
 575         if (image
->GetImageBlock().IsOk()) 
 577             wxChar
* data 
= b64enc( image
->GetImageBlock().GetData(), image
->GetImageBlock().GetDataSize() ); 
 587 long wxRichTextHTMLHandler::PtToSize(long size
) 
 590     int len 
= m_fontSizeMapping
.GetCount(); 
 591     for (i 
= 0; i 
< len
; i
++) 
 592         if (size 
<= m_fontSizeMapping
[i
]) 
 597 wxString 
wxRichTextHTMLHandler::SymbolicIndent(long indent
) 
 600     for(;indent 
> 0; indent 
-= 20) 
 601         in
.Append( wxT(" ") ); 
 605 const wxChar
* wxRichTextHTMLHandler::GetMimeType(int imageType
) 
 609     case wxBITMAP_TYPE_BMP
: 
 610         return wxT("image/bmp"); 
 611     case wxBITMAP_TYPE_TIFF
: 
 612         return wxT("image/tiff"); 
 613     case wxBITMAP_TYPE_GIF
: 
 614         return wxT("image/gif"); 
 615     case wxBITMAP_TYPE_PNG
: 
 616         return wxT("image/png"); 
 617     case wxBITMAP_TYPE_JPEG
: 
 618         return wxT("image/jpeg"); 
 620         return wxT("image/unknown"); 
 624 // exim-style base64 encoder 
 625 wxChar
* wxRichTextHTMLHandler::b64enc( unsigned char* input
, size_t in_len 
) 
 627     // elements of enc64 array must be 8 bit values 
 628     // otherwise encoder will fail 
 629     // hmmm.. Does wxT macro define a char as 16 bit value 
 630     // when compiling with UNICODE option? 
 631     static const wxChar enc64
[] = wxT("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/"); 
 632     wxChar
* output 
= new wxChar
[4*((in_len
+2)/3)+1]; 
 635     while( in_len
-- > 0 ) 
 637         register wxChar a
, b
; 
 641         *p
++ = enc64
[ (a 
>> 2) & 0x3f ]; 
 645             *p
++ = enc64
[ (a 
<< 4 ) & 0x30 ]; 
 653         *p
++ = enc64
[(( a 
<< 4 ) | ((b 
>> 4) &0xf )) & 0x3f]; 
 657             *p
++ = enc64
[ (b 
<< 2) & 0x3f ]; 
 664         *p
++ = enc64
[ ((( b 
<< 2 ) & 0x3f ) | ((a 
>> 6)& 0x3)) & 0x3f ]; 
 666         *p
++ = enc64
[ a 
& 0x3f ]; 
 675 /// Delete the in-memory or temporary files generated by the last operation 
 676 bool wxRichTextHTMLHandler::DeleteTemporaryImages() 
 678     return DeleteTemporaryImages(GetFlags(), m_imageLocations
); 
 681 /// Delete the in-memory or temporary files generated by the last operation 
 682 bool wxRichTextHTMLHandler::DeleteTemporaryImages(int flags
, const wxArrayString
& imageLocations
) 
 685     for (i 
= 0; i 
< imageLocations
.GetCount(); i
++) 
 687         wxString location 
= imageLocations
[i
]; 
 689         if (flags 
& wxRICHTEXT_HANDLER_SAVE_IMAGES_TO_MEMORY
) 
 692             wxMemoryFSHandler::RemoveFile(location
); 
 695         else if (flags 
& wxRICHTEXT_HANDLER_SAVE_IMAGES_TO_FILES
) 
 697             if (wxFileExists(location
)) 
 698                 wxRemoveFile(location
);