1 /////////////////////////////////////////////////////////////////////////////
2 // Name: src/richtext/richtexthtml.cpp
3 // Purpose: HTML I/O for wxRichTextCtrl
4 // Author: Julian Smart
8 // Copyright: (c) Julian Smart
9 // Licence: wxWindows licence
10 /////////////////////////////////////////////////////////////////////////////
12 // For compilers that support precompilation, includes "wx.h".
13 #include "wx/wxprec.h"
21 #include "wx/richtext/richtexthtml.h"
26 #include "wx/filename.h"
27 #include "wx/wfstream.h"
28 #include "wx/txtstrm.h"
// Registers wxRichTextHTMLHandler with the wxWidgets run-time class
// information system, naming wxRichTextFileHandler as its base class.
30 IMPLEMENT_DYNAMIC_CLASS(wxRichTextHTMLHandler
, wxRichTextFileHandler
)
32 /// Can we handle this filename (if using files)? By default, checks the extension.
33 bool wxRichTextHTMLHandler::CanHandle(const wxString
& filename
) const
35 wxString path
, file
, ext
;
36 wxSplitPath(filename
, & path
, & file
, & ext
);
38 return (ext
.Lower() == wxT("html") || ext
.Lower() == wxT("htm"));
// Load hook for HTML input. Both parameters are wrapped in WXUNUSED, so this
// implementation reads neither the buffer nor the stream.
// NOTE(review): the function body is not visible in this view; presumably it
// only reports failure because HTML import is not supported - confirm.
43 bool wxRichTextHTMLHandler::DoLoadFile(wxRichTextBuffer
*WXUNUSED(buffer
), wxInputStream
& WXUNUSED(stream
))
49 * We need to output only _changes_ in character formatting.
// Writes the contents of `buffer` to `stream` as an HTML document.
// Visible steps: emit the <html>/<body> preamble, an outer single-cell table
// and a document-wide <font> tag built from the buffer's attributes; then,
// for a child paragraph, emit its paragraph formatting followed by each text
// run and image it contains; finally emit the closing tags.
// NOTE(review): this view of the function is incomplete - the braces, the
// loop headers that drive `node` / `node2` and the return statement are not
// visible here.
52 bool wxRichTextHTMLHandler::DoSaveFile(wxRichTextBuffer
*buffer
, wxOutputStream
& stream
)
// Text wrapper around `stream`, used for all markup written directly here.
56 wxTextOutputStream
str(stream
);
// Both running styles start out as the buffer's own attributes.
58 wxTextAttrEx currentParaStyle
= buffer
->GetAttributes();
59 wxTextAttrEx currentCharStyle
= buffer
->GetAttributes();
61 str
<< wxT("<html><head></head><body>\n");
// NOTE(review): the two prose lines below and the statements after them, down
// to the one writing the 100%-wide <td>, read like a disabled draft of
// document-wide left/right indent support. Their comment delimiters are
// presumably outside this view - confirm before treating them as live code.
64 wxRichText may be support paper formats like a1/a2/a3/a4
65 when this widget grown enough, i should turn back and support its new features
68 str << wxT("<table border=0 cellpadding=0 cellspacing=0><tr><td>");
70 wxString left_indent = SymbolicIndent(currentParaStyle.GetLeftIndent());
71 wxString right_indent = SymbolicIndent(currentParaStyle.GetRightIndent());
73 str << wxString::Format(wxT("%s</td><td></td><td>%s</td></tr><tr>"),
74 left_indent.c_str(), //Document-Wide Left Indent
75 right_indent.c_str()); //Document-Wide Right Indent
77 str << wxT("<td></td><td width=\"100%\">");
// Outer table: one full-width cell that holds the whole document body.
80 str
<< wxT("<table border=0 cellpadding=0 cellspacing=0><tr><td width=\"100%\">");
// Document-wide font: face name, point size converted by Pt_To_Size, and the
// text colour in HTML syntax, all taken from the buffer's attributes.
82 str
<< wxString::Format(wxT("<font face=\"%s\" size=\"%ld\" color=\"%s\" >"),
83 currentParaStyle
.GetFont().GetFaceName().c_str(), Pt_To_Size( currentParaStyle
.GetFont().GetPointSize() ),
84 currentParaStyle
.GetTextColour().GetAsString(wxC2S_HTML_SYNTAX
).c_str());
86 //wxString align = GetAlignment( currentParaStyle.GetAlignment() );
87 //str << wxString::Format(wxT("<p align=\"%s\">"), align );
// Start at the buffer's first child object.
93 wxRichTextObjectList::compatibility_iterator node
= buffer
->GetChildren().GetFirst();
// wxDynamicCast yields NULL when the child is not a wxRichTextParagraph; the
// assertion below flags that case.
96 wxRichTextParagraph
* para
= wxDynamicCast(node
->GetData(), wxRichTextParagraph
);
97 wxASSERT (para
!= NULL
);
// Paragraph style comes from the paragraph's combined attributes.
101 wxTextAttrEx
paraStyle(para
->GetCombinedAttributes());
// Note: the raw `stream` is passed on, not `str`; each helper constructs its
// own wxTextOutputStream over it.
103 OutputParagraphFormatting(currentParaStyle
, paraStyle
, stream
);
// Start at the paragraph's first child object.
105 wxRichTextObjectList::compatibility_iterator node2
= para
->GetChildren().GetFirst();
108 wxRichTextObject
* obj
= node2
->GetData();
// Non-empty plain-text objects are written as text ...
109 wxRichTextPlainText
* textObj
= wxDynamicCast(obj
, wxRichTextPlainText
);
110 if (textObj
&& !textObj
->IsEmpty())
// Character style: the object's own attributes combined with the paragraph's.
112 wxTextAttrEx
charStyle(para
->GetCombinedAttributes(obj
->GetAttributes()));
113 BeginCharacterFormatting(currentCharStyle
, charStyle
, paraStyle
, stream
);
// The text is written exactly as GetText() returns it.
// NOTE(review): no escaping of '<', '>' or '&' is visible here - confirm
// whether text containing those characters can corrupt the generated markup.
115 str
<< textObj
->GetText();
117 EndCharacterFormatting(currentCharStyle
, charStyle
, paraStyle
, stream
);
// ... and non-empty image objects are written inline via Image_to_Base64.
120 wxRichTextImage
* image
= wxDynamicCast(obj
, wxRichTextImage
);
121 if( image
&& !image
->IsEmpty())
122 Image_to_Base64( image
, stream
);
// Advance to the paragraph's next child.
124 node2
= node2
->GetNext();
127 //OutputParagraphFormatting(currentParaStyle, para->GetAttributes(), stream, false);
// Advance to the buffer's next child.
129 node
= node
->GetNext();
// Close the document-wide font, the outer table and the document.
132 str
<< wxT("</font></td></tr></table></body></html>\n");
// Emits the markup that has to precede one run of text.
// Three concerns are visible, in this order:
//   1. lists  - closing an open <ul>/<ol>, positioning, opening a new list
//               tag and writing <li>, driven by paraStyle's bullet style;
//   2. indent - opening or closing the tables used to imitate a left indent,
//               driven by paraStyle's left indent and left sub-indent and
//               tracked in m_indent (current level) / m_indents (open levels);
//   3. font   - a <font> tag listing only the face / size / colour values of
//               thisStyle that differ from currentStyle, followed by checks
//               for bold, italic and underline.
// currentStyle: style to compare against; thisStyle: style of this run;
// paraStyle: style of the enclosing paragraph; stream: output destination.
// NOTE(review): braces, else-branches, loop headers and several statements
// (for example the declarations of `tag` and `style`) are not visible in this
// view, so the exact nesting of the statements below cannot be confirmed here.
137 void wxRichTextHTMLHandler::BeginCharacterFormatting(const wxTextAttrEx
& currentStyle
, const wxTextAttrEx
& thisStyle
, const wxTextAttrEx
& paraStyle
, wxOutputStream
& stream
)
139 wxTextOutputStream
str(stream
);
141 //Is this paragraph a bulleted (list) item?
142 if( paraStyle
.GetBulletStyle() != wxTEXT_ATTR_BULLET_STYLE_NONE
)
144 //Is there any opened list?
149 //Is the item among the previous ones
150 //Is the item one of the previous list tag's child items
// The item belongs to the open list when its left indent is exactly 100
// beyond the current level, or is below 100 altogether.
151 if( (paraStyle
.GetLeftIndent() == (m_indent
+ 100)) || (paraStyle
.GetLeftIndent() < 100) )
152 str
<< wxT("<li>");//Yes it is
157 //So we should close the list tag
// m_is_ul selects which closing tag matches the list that is open.
158 str
<< (m_is_ul
? wxT("</ul>") : wxT("</ol>"));
160 //And renavigate to new list's horizontal position
161 NavigateToListPosition(paraStyle
, str
);
164 //Get the appropriate tag, an ol for numerical values, an ul for dot, square etc.
166 TypeOfList(paraStyle
, tag
);
167 str
<< tag
<< wxT("<li>");
172 //No there isn't a list
174 //navigate to new list's horizontal position(indent)
175 NavigateToListPosition(paraStyle
, str
);
177 //Get the appropriate tag, an ol for numerical values, an ul for dot, square etc.
179 TypeOfList(paraStyle
, tag
);
180 str
<< tag
<< wxT("<li>");
182 //Now we have a list, mark it.
188 //The item is not bulleted and there is a list that should be closed now.
191 str
<< (m_is_ul
? wxT("</ul>") : wxT("</ol>"));
192 //And mark that there is no open list any more
196 // does the item have an indentation ?
197 if( paraStyle
.GetLeftIndent() )
// Table-based indentation is only applied to non-bulleted paragraphs.
199 if( paraStyle
.GetBulletStyle() == wxTEXT_ATTR_BULLET_STYLE_NONE
)
// Same effective indent (left indent + sub-indent) as the current level.
203 if( (paraStyle
.GetLeftIndent() + paraStyle
.GetLeftSubIndent()) == m_indent
)
205 if( paraStyle
.GetLeftSubIndent() < 0 )
// `~x` is bitwise NOT, i.e. -x - 1, so a negative sub-indent x is passed to
// SymbolicIndent as |x| - 1 rather than |x|.
207 str
<< SymbolicIndent(~paraStyle
.GetLeftSubIndent());
// Deeper than the current level: open a further indent table and record it.
212 if( paraStyle
.GetLeftIndent() + paraStyle
.GetLeftSubIndent() > m_indent
)
214 Indent(paraStyle
, str
);
215 m_indent
= paraStyle
.GetLeftIndent() + paraStyle
.GetLeftSubIndent();
216 m_indents
.Add( m_indent
);
// Index of the most recently recorded indent level.
// NOTE(review): the `break` further down implies the following statements sit
// in a loop that uses `i`; its header is not visible here - presumably it
// steps `i` downwards through m_indents, confirm.
220 int i
= m_indents
.size() - 1;
223 if( m_indent
< (paraStyle
.GetLeftIndent() + paraStyle
.GetLeftSubIndent()) )
225 Indent(paraStyle
, str
);
226 m_indent
= paraStyle
.GetLeftIndent() + paraStyle
.GetLeftSubIndent();
227 m_indents
.Add( m_indent
);
231 else if( m_indent
== (paraStyle
.GetLeftIndent() + paraStyle
.GetLeftSubIndent()) )
233 if( paraStyle
.GetLeftSubIndent() < 0 )
235 str
<< SymbolicIndent(~paraStyle
.GetLeftSubIndent());
// Close one indent table and forget its recorded level.
241 str
<< wxT("</td></tr></table>");
243 m_indents
.RemoveAt(i
);
// No recorded level remains: the current indent falls back to 0.
245 if( i
< 1 ){m_indent
=0; break;}
// Otherwise the previous recorded level becomes the current one.
246 m_indent
= m_indents
[i
-1];
254 Indent(paraStyle
, str
);
255 m_indent
= paraStyle
.GetLeftIndent() + paraStyle
.GetLeftSubIndent();
256 m_indents
.Add( m_indent
);
262 //The item is not indented and there are table(s) that should be closed now.
// One closing sequence per recorded indent level.
265 for(unsigned int i
= 0; i
< m_indents
.size(); i
++ )
266 str
<< wxT("</td></tr></table>");
275 //Is there any change on the font properties of the item
// Each attribute that differs from currentStyle is appended to `style`.
276 if( thisStyle
.GetFont().GetFaceName() != currentStyle
.GetFont().GetFaceName() )
277 style
+= wxString::Format(wxT(" face=\"%s\""), thisStyle
.GetFont().GetFaceName().c_str());
278 if( thisStyle
.GetFont().GetPointSize() != currentStyle
.GetFont().GetPointSize() )
279 style
+= wxString::Format(wxT(" size=\"%ld\""), Pt_To_Size(thisStyle
.GetFont().GetPointSize()) );
280 if( thisStyle
.GetTextColour() != currentStyle
.GetTextColour() )
281 style
+= wxString::Format(wxT(" color=\"%s\""), thisStyle
.GetTextColour().GetAsString(wxC2S_HTML_SYNTAX
).c_str());
// NOTE(review): the condition guarding this write is not visible here;
// presumably the tag is only written when `style` is not empty - confirm.
285 str
<< wxString::Format(wxT("<font %s >"), style
.c_str());
// Bold, italic, underline - tested in this order.
// NOTE(review): the statements these tests guard are not visible in this
// view; presumably they write the matching opening tags - confirm.
289 if( thisStyle
.GetFont().GetWeight() == wxBOLD
)
291 if( thisStyle
.GetFont().GetStyle() == wxITALIC
)
293 if( thisStyle
.GetFont().GetUnderlined() )
// Emits the markup that has to follow one run of text.
// Only thisStyle and stream are used; currentStyle and paraStyle are wrapped
// in WXUNUSED. Underline, italic and bold are tested in that order, which is
// the reverse of the order used in BeginCharacterFormatting, and a closing
// </font> tag is written.
// NOTE(review): the statements guarded by the three tests, and any condition
// guarding the </font> write, are not visible in this view - presumably the
// tests write the matching closing tags; confirm.
297 void wxRichTextHTMLHandler::EndCharacterFormatting(const wxTextAttrEx
& WXUNUSED(currentStyle
), const wxTextAttrEx
& thisStyle
, const wxTextAttrEx
& WXUNUSED(paraStyle
), wxOutputStream
& stream
)
299 wxTextOutputStream
str(stream
);
301 if( thisStyle
.GetFont().GetUnderlined() )
303 if( thisStyle
.GetFont().GetStyle() == wxITALIC
)
305 if( thisStyle
.GetFont().GetWeight() == wxBOLD
)
311 str
<< wxT("</font>");
315 /// Output paragraph formatting: writes an opening <p> tag whose align
/// attribute is derived from thisStyle via GetAlignment().
/// currentStyle is wrapped in WXUNUSED and is not read.
316 void wxRichTextHTMLHandler::OutputParagraphFormatting(const wxTextAttrEx
& WXUNUSED(currentStyle
), const wxTextAttrEx
& thisStyle
, wxOutputStream
& stream
)
318 //If there is no opened list currently, insert a <p> after every paragraph
// NOTE(review): the test for "no opened list" that the comment above refers
// to is not visible in this view; confirm that the statements below are
// guarded by it.
321 wxTextOutputStream
str(stream
);
322 wxString align
= GetAlignment( thisStyle
);
323 str
<< wxString::Format(wxT("<p align=\"%s\">"), align
.c_str());
// Brings the output to the horizontal position at which a list for
// `thisStyle` can be opened. The list tag itself is treated as contributing
// 100 units of indent, so the surrounding tables must end 100 units to the
// left of the paragraph's left indent.
// Visible behaviour: when the current level (m_indent) plus 100 is still
// short of the left indent, LIndent() opens a further table and the new
// level (left indent - 100) is stored in m_indent and appended to m_indents;
// otherwise tables are closed and their levels removed from m_indents.
// NOTE(review): braces, else-branches and the header of the loop implied by
// `break` are not visible in this view.
327 void wxRichTextHTMLHandler::NavigateToListPosition(const wxTextAttrEx
& thisStyle
, wxTextOutputStream
& str
)
329 //indenting an item using an ul/ol tag is equal to inserting 5 x on its left side.
330 //so we should start from 100 point left
332 //Is the second td's left wall of the current indentation table at the 100+ point-left-side
333 //of the item, horizontally?
334 if( m_indent
+ 100 < thisStyle
.GetLeftIndent() )
337 LIndent(thisStyle
, str
);
338 m_indent
= thisStyle
.GetLeftIndent() - 100;
339 m_indents
.Add( m_indent
);
// Index of the most recently recorded indent level.
// NOTE(review): presumably the statements below run in a loop that steps `i`
// downwards through m_indents - confirm against the full source.
344 int i
= m_indents
.size() - 1;
347 //Is the second td's left wall of the current indentation table at the 100+ point-left-side
349 if( m_indent
+ 100 < thisStyle
.GetLeftIndent() )
352 LIndent(thisStyle
, str
);
353 m_indent
= thisStyle
.GetLeftIndent() - 100;
354 m_indents
.Add( m_indent
);
// Exactly at the required position.
// NOTE(review): the statement guarded by this test is not visible here.
357 else if( m_indent
+ 100 == thisStyle
.GetLeftIndent() )
361 //No it is not, the second td's left wall of the current indentation table is at the
362 //right side of the current item horizontally, so close it.
363 str
<< wxT("</td></tr></table>");
365 m_indents
.RemoveAt(i
);
// No recorded level remains: the current indent falls back to 0.
367 if( i
< 1 ){m_indent
=0; break;}
// Otherwise the previous recorded level becomes the current one.
368 m_indent
= m_indents
[i
-1];
372 void wxRichTextHTMLHandler::Indent( const wxTextAttrEx
& thisStyle
, wxTextOutputStream
& str
)
374 //As a five year experienced web developer i assure you there is no way to indent an item
375 //in html way, but we can use tables.
379 //Item -> "Hello world"
380 //Its Left Indentation -> 100
381 //Its Left Sub-Indentation ->40
382 //A typical indentation-table for the item will be construct as the following
386 //LSI = Left Sub Indent
387 //LI = Left Indent - LSI
389 //-------------------------------------------
390 //| nbsp;|nbsp;nbsp;Hello World |
393 //| --LI-- | --LSI-- |
394 //-------------------------------------------
396 str
<< wxT("<table width=\"100%\" border=\"0\" cellpadding=\"0\" cellspacing=\"0\"><tr>");
398 wxString symbolic_indent
= SymbolicIndent( (thisStyle
.GetLeftIndent() + thisStyle
.GetLeftSubIndent()) - m_indent
);
399 str
<< wxString::Format( wxT("<td>%s</td>"), symbolic_indent
.c_str() );
400 str
<< wxT("<td width=\"100%\">");
402 if( thisStyle
.GetLeftSubIndent() < 0 )
404 str
<< SymbolicIndent(~thisStyle
.GetLeftSubIndent());
408 void wxRichTextHTMLHandler::LIndent( const wxTextAttrEx
& thisStyle
, wxTextOutputStream
& str
)
411 //r.BeginNumberedBullet(1, 200, 60);
413 //r.WriteText(wxT("first item"));
414 //r.EndNumberedBullet();
415 //r.BeginNumberedBullet(2, 200, 60);
417 //r.WriteText(wxT("second item."));
418 //r.EndNumberedBullet();
420 //A typical indentation-table for the item will be construct as the following
422 //1 x nbsp = 20 point
423 //ULI -> 100pt (UL/OL tag indents its sub element by 100 point)
424 //<--------- 100 pt ---------->|
425 //------------------------------------------------------
426 //| nbsp; nbsp;|<ul> |
427 //| |<-ULI-><li>first item |
428 //| |<-ULI-><li>second item |
430 //------------------------------------------------------
434 str
<< wxT("<table width=\"100%\" border=\"0\" cellpadding=\"0\" cellspacing=\"0\"><tr>");
436 wxString symbolic_indent
= SymbolicIndent( (thisStyle
.GetLeftIndent() - m_indent
) - 100);
437 str
<< wxString::Format( wxT("<td>%s</td>"), symbolic_indent
.c_str() );
438 str
<< wxT("<td width=\"100%\">");
// Chooses the opening list tag for a bulleted paragraph and stores it in
// `tag` (output parameter).
// Visible mapping from thisStyle.GetBulletStyle():
//   ARABIC | PERIOD -> <ol type="1">
//   LETTERS_UPPER   -> <ol type="A">
//   LETTERS_LOWER   -> <ol type="a">
//   ROMAN_UPPER     -> <ol type="I">
//   ROMAN_LOWER     -> <ol type="i">
// Every test is an exact equality on the whole style value, so a style that
// carries any additional flag bits matches none of these branches.
// NOTE(review): the fallback for every other style is not visible in this
// view. Callers close lists with </ul> or </ol> depending on m_is_ul, so
// presumably this function also produces <ul> and maintains m_is_ul - confirm.
441 void wxRichTextHTMLHandler::TypeOfList( const wxTextAttrEx
& thisStyle
, wxString
& tag
)
443 //We can use number attribute of li tag but not all the browsers support it.
444 //also wxHtmlWindow doesn't support type attribute.
447 if( thisStyle
.GetBulletStyle() == (wxTEXT_ATTR_BULLET_STYLE_ARABIC
|wxTEXT_ATTR_BULLET_STYLE_PERIOD
))
448 tag
= wxT("<ol type=\"1\">");
449 else if( thisStyle
.GetBulletStyle() == wxTEXT_ATTR_BULLET_STYLE_LETTERS_UPPER
)
450 tag
= wxT("<ol type=\"A\">");
451 else if( thisStyle
.GetBulletStyle() == wxTEXT_ATTR_BULLET_STYLE_LETTERS_LOWER
)
452 tag
= wxT("<ol type=\"a\">");
453 else if( thisStyle
.GetBulletStyle() == wxTEXT_ATTR_BULLET_STYLE_ROMAN_UPPER
)
454 tag
= wxT("<ol type=\"I\">");
455 else if( thisStyle
.GetBulletStyle() == wxTEXT_ATTR_BULLET_STYLE_ROMAN_LOWER
)
456 tag
= wxT("<ol type=\"i\">");
// Translates thisStyle.GetAlignment() into the value used for the HTML
// `align` attribute (see OutputParagraphFormatting).
// Visible results: wxTEXT_ALIGNMENT_CENTER -> "center",
//                  wxTEXT_ALIGNMENT_JUSTIFIED -> "justify".
// NOTE(review): the values returned for wxTEXT_ALIGNMENT_LEFT,
// wxTEXT_ALIGNMENT_RIGHT and any other alignment are not visible in this
// view - presumably "left" and "right"; confirm against the full source.
464 wxString
wxRichTextHTMLHandler::GetAlignment( const wxTextAttrEx
& thisStyle
)
466 switch( thisStyle
.GetAlignment() )
468 case wxTEXT_ALIGNMENT_LEFT
:
470 case wxTEXT_ALIGNMENT_RIGHT
:
472 case wxTEXT_ALIGNMENT_CENTER
:
473 return wxT("center");
474 case wxTEXT_ALIGNMENT_JUSTIFIED
:
475 return wxT("justify");
// Writes `image` into the HTML output as an <img> tag whose src attribute
// carries the image data inline: the MIME type of the image block, the text
// ";base64," and then the block's data encoded by b64enc().
// NOTE(review): several statements are not visible in this view, including
// the write of the encoded data, the release of the buffer returned by
// b64enc() (it is allocated with new[]) and the end of the tag.
// NOTE(review): no "data:" scheme prefix is visible in front of the MIME
// type; an inline data URI requires one - confirm that it is emitted.
481 void wxRichTextHTMLHandler::Image_to_Base64(wxRichTextImage
* image
, wxOutputStream
& stream
)
483 wxTextOutputStream
str(stream
);
485 str
<< wxT("<img src=\"");
487 str
<< GetMimeType(image
->GetImageBlock().GetImageType());
488 str
<< wxT(";base64,");
// True when the image itself is valid but its image block holds no data yet.
// NOTE(review): the guarded statement is not visible here; presumably it
// fills the image block from the image before the data is encoded - confirm.
490 if (image
->GetImage().Ok() && !image
->GetImageBlock().GetData())
// Encode the block's raw bytes; b64enc() returns a newly allocated buffer.
493 wxChar
* data
= b64enc( image
->GetImageBlock().GetData(), image
->GetImageBlock().GetDataSize() );
501 long wxRichTextHTMLHandler::Pt_To_Size(long size
)
503 //return most approximate size
504 if(size
< 9 ) return 1;
505 else if( size
< 11 ) return 2;
506 else if( size
< 14 ) return 3;
507 else if( size
< 18 ) return 4;
508 else if( size
< 23 ) return 5;
509 else if( size
< 30 ) return 6;
513 wxString
wxRichTextHTMLHandler::SymbolicIndent(long indent
)
516 for(;indent
> 0; indent
-= 20)
517 in
.Append( wxT(" ") );
521 const wxChar
* wxRichTextHTMLHandler::GetMimeType(int imageType
)
525 case wxBITMAP_TYPE_BMP
:
526 return wxT("image/bmp");
527 case wxBITMAP_TYPE_TIF
:
528 return wxT("image/tiff");
529 case wxBITMAP_TYPE_GIF
:
530 return wxT("image/gif");
531 case wxBITMAP_TYPE_PNG
:
532 return wxT("image/png");
533 case wxBITMAP_TYPE_JPEG
:
534 return wxT("image/jpeg");
536 return wxT("image/unknown");
540 //exim-style base64 encoder
// Encodes `in_len` bytes starting at `input` as base64 text.
// The result is allocated with new[] and sized at four characters per group
// of three input bytes (rounded up) plus one extra element, presumably for a
// terminator. No release is visible in this function, so the caller is
// expected to delete[] the returned buffer.
// NOTE(review): the declaration of `p`, the reads that fill `a` and `b`, the
// padding writes and the return statement are not visible in this view.
541 wxChar
* wxRichTextHTMLHandler::b64enc( unsigned char* input
, size_t in_len
)
543 //elements of enc64 array must be 8 bit values
544 //otherwise encoder will fail
545 //hmmm.. Does wxT macro define a char as 16 bit value
546 //when compiling with UNICODE option?
// The base64 alphabet, indexed by 6-bit value.
547 static const wxChar enc64
[] = wxT("ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/");
548 wxChar
* output
= new wxChar
[4*((in_len
+2)/3)+1];
// in_len counts down as input is consumed.
551 while( in_len
-- > 0 )
// NOTE(review): the `register` storage class was removed in C++17; this
// declaration needs attention before the file is built in that mode.
553 register wxChar a
, b
;
// 1st output character: the top six bits of `a`.
557 *p
++ = enc64
[ (a
>> 2) & 0x3f ];
// 2nd output character built from `a` alone: its low two bits in the two
// high positions of the six-bit value. Presumably used when no second input
// byte remains - confirm.
561 *p
++ = enc64
[ (a
<< 4 ) & 0x30 ];
// 2nd output character for the normal case: the low two bits of `a`
// followed by the top four bits of `b`.
569 *p
++ = enc64
[(( a
<< 4 ) | ((b
>> 4) &0xf )) & 0x3f];
// 3rd output character built from `b` alone: its low four bits in the four
// high positions. Presumably used when no third input byte remains - confirm.
573 *p
++ = enc64
[ (b
<< 2) & 0x3f ];
// 3rd output character for the normal case: the low four bits of `b`
// followed by the top two bits of `a`, which presumably holds the third
// input byte by this point - confirm.
580 *p
++ = enc64
[ ((( b
<< 2 ) & 0x3f ) | ((a
>> 6)& 0x3)) & 0x3f ];
// 4th output character: the low six bits of `a`.
582 *p
++ = enc64
[ a
& 0x3f ];