1 /////////////////////////////////////////////////////////////////////////////
2 // Name: src/common/translation.cpp
3 // Purpose: Internationalization and localisation for wxWidgets
4 // Author: Vadim Zeitlin, Vaclav Slavik,
5 // Michael N. Filippov <michael@idisys.iae.nsk.su>
6 // (2003/09/30 - PluralForms support)
9 // Copyright: (c) 1998 Vadim Zeitlin <zeitlin@dptmaths.ens-cachan.fr>
10 // Licence: wxWindows licence
11 /////////////////////////////////////////////////////////////////////////////
13 // ============================================================================
15 // ============================================================================
17 // ----------------------------------------------------------------------------
19 // ----------------------------------------------------------------------------
21 // For compilers that support precompilation, includes "wx.h".
22 #include "wx/wxprec.h"
31 #include "wx/dynarray.h"
32 #include "wx/string.h"
36 #include "wx/hashmap.h"
37 #include "wx/module.h"
45 #include "wx/filename.h"
46 #include "wx/tokenzr.h"
47 #include "wx/fontmap.h"
48 #include "wx/scopedptr.h"
49 #include "wx/stdpaths.h"
50 #include "wx/hashset.h"
52 // ----------------------------------------------------------------------------
54 // ----------------------------------------------------------------------------
56 typedef wxUint32 size_t32
;
58 // ----------------------------------------------------------------------------
60 // ----------------------------------------------------------------------------
62 // magic number identifying the .mo format file
63 const size_t32 MSGCATALOG_MAGIC
= 0x950412de;
64 const size_t32 MSGCATALOG_MAGIC_SW
= 0xde120495;
66 #define TRACE_I18N wxS("i18n")
68 // ============================================================================
70 // ============================================================================
72 // ----------------------------------------------------------------------------
73 // Plural forms parser
74 // ----------------------------------------------------------------------------
80 LogicalOrExpression '?' Expression ':' Expression
84 LogicalAndExpression "||" LogicalOrExpression // to (a || b) || c
88 EqualityExpression "&&" LogicalAndExpression // to (a && b) && c
92 RelationalExpression "==" RelationalExperession
93 RelationalExpression "!=" RelationalExperession
97 MultiplicativeExpression '>' MultiplicativeExpression
98 MultiplicativeExpression '<' MultiplicativeExpression
99 MultiplicativeExpression ">=" MultiplicativeExpression
100 MultiplicativeExpression "<=" MultiplicativeExpression
101 MultiplicativeExpression
103 MultiplicativeExpression:
104 PmExpression '%' PmExpression
113 class wxPluralFormsToken
118 T_ERROR
, T_EOF
, T_NUMBER
, T_N
, T_PLURAL
, T_NPLURALS
, T_EQUAL
, T_ASSIGN
,
119 T_GREATER
, T_GREATER_OR_EQUAL
, T_LESS
, T_LESS_OR_EQUAL
,
120 T_REMINDER
, T_NOT_EQUAL
,
121 T_LOGICAL_AND
, T_LOGICAL_OR
, T_QUESTION
, T_COLON
, T_SEMICOLON
,
122 T_LEFT_BRACKET
, T_RIGHT_BRACKET
124 Type
type() const { return m_type
; }
125 void setType(Type type
) { m_type
= type
; }
128 Number
number() const { return m_number
; }
129 void setNumber(Number num
) { m_number
= num
; }
136 class wxPluralFormsScanner
139 wxPluralFormsScanner(const char* s
);
140 const wxPluralFormsToken
& token() const { return m_token
; }
141 bool nextToken(); // returns false if error
144 wxPluralFormsToken m_token
;
147 wxPluralFormsScanner::wxPluralFormsScanner(const char* s
) : m_s(s
)
152 bool wxPluralFormsScanner::nextToken()
154 wxPluralFormsToken::Type type
= wxPluralFormsToken::T_ERROR
;
155 while (isspace((unsigned char) *m_s
))
161 type
= wxPluralFormsToken::T_EOF
;
163 else if (isdigit((unsigned char) *m_s
))
165 wxPluralFormsToken::Number number
= *m_s
++ - '0';
166 while (isdigit((unsigned char) *m_s
))
168 number
= number
* 10 + (*m_s
++ - '0');
170 m_token
.setNumber(number
);
171 type
= wxPluralFormsToken::T_NUMBER
;
173 else if (isalpha((unsigned char) *m_s
))
175 const char* begin
= m_s
++;
176 while (isalnum((unsigned char) *m_s
))
180 size_t size
= m_s
- begin
;
181 if (size
== 1 && memcmp(begin
, "n", size
) == 0)
183 type
= wxPluralFormsToken::T_N
;
185 else if (size
== 6 && memcmp(begin
, "plural", size
) == 0)
187 type
= wxPluralFormsToken::T_PLURAL
;
189 else if (size
== 8 && memcmp(begin
, "nplurals", size
) == 0)
191 type
= wxPluralFormsToken::T_NPLURALS
;
194 else if (*m_s
== '=')
200 type
= wxPluralFormsToken::T_EQUAL
;
204 type
= wxPluralFormsToken::T_ASSIGN
;
207 else if (*m_s
== '>')
213 type
= wxPluralFormsToken::T_GREATER_OR_EQUAL
;
217 type
= wxPluralFormsToken::T_GREATER
;
220 else if (*m_s
== '<')
226 type
= wxPluralFormsToken::T_LESS_OR_EQUAL
;
230 type
= wxPluralFormsToken::T_LESS
;
233 else if (*m_s
== '%')
236 type
= wxPluralFormsToken::T_REMINDER
;
238 else if (*m_s
== '!' && m_s
[1] == '=')
241 type
= wxPluralFormsToken::T_NOT_EQUAL
;
243 else if (*m_s
== '&' && m_s
[1] == '&')
246 type
= wxPluralFormsToken::T_LOGICAL_AND
;
248 else if (*m_s
== '|' && m_s
[1] == '|')
251 type
= wxPluralFormsToken::T_LOGICAL_OR
;
253 else if (*m_s
== '?')
256 type
= wxPluralFormsToken::T_QUESTION
;
258 else if (*m_s
== ':')
261 type
= wxPluralFormsToken::T_COLON
;
262 } else if (*m_s
== ';') {
264 type
= wxPluralFormsToken::T_SEMICOLON
;
266 else if (*m_s
== '(')
269 type
= wxPluralFormsToken::T_LEFT_BRACKET
;
271 else if (*m_s
== ')')
274 type
= wxPluralFormsToken::T_RIGHT_BRACKET
;
276 m_token
.setType(type
);
277 return type
!= wxPluralFormsToken::T_ERROR
;
280 class wxPluralFormsNode
;
282 // NB: Can't use wxDEFINE_SCOPED_PTR_TYPE because wxPluralFormsNode is not
283 // fully defined yet:
284 class wxPluralFormsNodePtr
287 wxPluralFormsNodePtr(wxPluralFormsNode
*p
= NULL
) : m_p(p
) {}
288 ~wxPluralFormsNodePtr();
289 wxPluralFormsNode
& operator*() const { return *m_p
; }
290 wxPluralFormsNode
* operator->() const { return m_p
; }
291 wxPluralFormsNode
* get() const { return m_p
; }
292 wxPluralFormsNode
* release();
293 void reset(wxPluralFormsNode
*p
);
296 wxPluralFormsNode
*m_p
;
299 class wxPluralFormsNode
302 wxPluralFormsNode(const wxPluralFormsToken
& token
) : m_token(token
) {}
303 const wxPluralFormsToken
& token() const { return m_token
; }
304 const wxPluralFormsNode
* node(unsigned i
) const
305 { return m_nodes
[i
].get(); }
306 void setNode(unsigned i
, wxPluralFormsNode
* n
);
307 wxPluralFormsNode
* releaseNode(unsigned i
);
308 wxPluralFormsToken::Number
evaluate(wxPluralFormsToken::Number n
) const;
311 wxPluralFormsToken m_token
;
312 wxPluralFormsNodePtr m_nodes
[3];
315 wxPluralFormsNodePtr::~wxPluralFormsNodePtr()
319 wxPluralFormsNode
* wxPluralFormsNodePtr::release()
321 wxPluralFormsNode
*p
= m_p
;
325 void wxPluralFormsNodePtr::reset(wxPluralFormsNode
*p
)
335 void wxPluralFormsNode::setNode(unsigned i
, wxPluralFormsNode
* n
)
340 wxPluralFormsNode
* wxPluralFormsNode::releaseNode(unsigned i
)
342 return m_nodes
[i
].release();
345 wxPluralFormsToken::Number
346 wxPluralFormsNode::evaluate(wxPluralFormsToken::Number n
) const
348 switch (token().type())
351 case wxPluralFormsToken::T_NUMBER
:
352 return token().number();
353 case wxPluralFormsToken::T_N
:
356 case wxPluralFormsToken::T_EQUAL
:
357 return node(0)->evaluate(n
) == node(1)->evaluate(n
);
358 case wxPluralFormsToken::T_NOT_EQUAL
:
359 return node(0)->evaluate(n
) != node(1)->evaluate(n
);
360 case wxPluralFormsToken::T_GREATER
:
361 return node(0)->evaluate(n
) > node(1)->evaluate(n
);
362 case wxPluralFormsToken::T_GREATER_OR_EQUAL
:
363 return node(0)->evaluate(n
) >= node(1)->evaluate(n
);
364 case wxPluralFormsToken::T_LESS
:
365 return node(0)->evaluate(n
) < node(1)->evaluate(n
);
366 case wxPluralFormsToken::T_LESS_OR_EQUAL
:
367 return node(0)->evaluate(n
) <= node(1)->evaluate(n
);
368 case wxPluralFormsToken::T_REMINDER
:
370 wxPluralFormsToken::Number number
= node(1)->evaluate(n
);
373 return node(0)->evaluate(n
) % number
;
380 case wxPluralFormsToken::T_LOGICAL_AND
:
381 return node(0)->evaluate(n
) && node(1)->evaluate(n
);
382 case wxPluralFormsToken::T_LOGICAL_OR
:
383 return node(0)->evaluate(n
) || node(1)->evaluate(n
);
385 case wxPluralFormsToken::T_QUESTION
:
386 return node(0)->evaluate(n
)
387 ? node(1)->evaluate(n
)
388 : node(2)->evaluate(n
);
395 class wxPluralFormsCalculator
398 wxPluralFormsCalculator() : m_nplurals(0), m_plural(0) {}
400 // input: number, returns msgstr index
401 int evaluate(int n
) const;
403 // input: text after "Plural-Forms:" (e.g. "nplurals=2; plural=(n != 1);"),
404 // if s == 0, creates default handler
405 // returns 0 if error
406 static wxPluralFormsCalculator
* make(const char* s
= 0);
408 ~wxPluralFormsCalculator() {}
410 void init(wxPluralFormsToken::Number nplurals
, wxPluralFormsNode
* plural
);
413 wxPluralFormsToken::Number m_nplurals
;
414 wxPluralFormsNodePtr m_plural
;
417 wxDEFINE_SCOPED_PTR_TYPE(wxPluralFormsCalculator
)
419 void wxPluralFormsCalculator::init(wxPluralFormsToken::Number nplurals
,
420 wxPluralFormsNode
* plural
)
422 m_nplurals
= nplurals
;
423 m_plural
.reset(plural
);
426 int wxPluralFormsCalculator::evaluate(int n
) const
428 if (m_plural
.get() == 0)
432 wxPluralFormsToken::Number number
= m_plural
->evaluate(n
);
433 if (number
< 0 || number
> m_nplurals
)
441 class wxPluralFormsParser
444 wxPluralFormsParser(wxPluralFormsScanner
& scanner
) : m_scanner(scanner
) {}
445 bool parse(wxPluralFormsCalculator
& rCalculator
);
448 wxPluralFormsNode
* parsePlural();
449 // stops at T_SEMICOLON, returns 0 if error
450 wxPluralFormsScanner
& m_scanner
;
451 const wxPluralFormsToken
& token() const;
454 wxPluralFormsNode
* expression();
455 wxPluralFormsNode
* logicalOrExpression();
456 wxPluralFormsNode
* logicalAndExpression();
457 wxPluralFormsNode
* equalityExpression();
458 wxPluralFormsNode
* multiplicativeExpression();
459 wxPluralFormsNode
* relationalExpression();
460 wxPluralFormsNode
* pmExpression();
463 bool wxPluralFormsParser::parse(wxPluralFormsCalculator
& rCalculator
)
465 if (token().type() != wxPluralFormsToken::T_NPLURALS
)
469 if (token().type() != wxPluralFormsToken::T_ASSIGN
)
473 if (token().type() != wxPluralFormsToken::T_NUMBER
)
475 wxPluralFormsToken::Number nplurals
= token().number();
478 if (token().type() != wxPluralFormsToken::T_SEMICOLON
)
482 if (token().type() != wxPluralFormsToken::T_PLURAL
)
486 if (token().type() != wxPluralFormsToken::T_ASSIGN
)
490 wxPluralFormsNode
* plural
= parsePlural();
493 if (token().type() != wxPluralFormsToken::T_SEMICOLON
)
497 if (token().type() != wxPluralFormsToken::T_EOF
)
499 rCalculator
.init(nplurals
, plural
);
503 wxPluralFormsNode
* wxPluralFormsParser::parsePlural()
505 wxPluralFormsNode
* p
= expression();
510 wxPluralFormsNodePtr
n(p
);
511 if (token().type() != wxPluralFormsToken::T_SEMICOLON
)
518 const wxPluralFormsToken
& wxPluralFormsParser::token() const
520 return m_scanner
.token();
523 bool wxPluralFormsParser::nextToken()
525 if (!m_scanner
.nextToken())
530 wxPluralFormsNode
* wxPluralFormsParser::expression()
532 wxPluralFormsNode
* p
= logicalOrExpression();
535 wxPluralFormsNodePtr
n(p
);
536 if (token().type() == wxPluralFormsToken::T_QUESTION
)
538 wxPluralFormsNodePtr
qn(new wxPluralFormsNode(token()));
549 if (token().type() != wxPluralFormsToken::T_COLON
)
563 qn
->setNode(0, n
.release());
569 wxPluralFormsNode
*wxPluralFormsParser::logicalOrExpression()
571 wxPluralFormsNode
* p
= logicalAndExpression();
574 wxPluralFormsNodePtr
ln(p
);
575 if (token().type() == wxPluralFormsToken::T_LOGICAL_OR
)
577 wxPluralFormsNodePtr
un(new wxPluralFormsNode(token()));
582 p
= logicalOrExpression();
587 wxPluralFormsNodePtr
rn(p
); // right
588 if (rn
->token().type() == wxPluralFormsToken::T_LOGICAL_OR
)
590 // see logicalAndExpression comment
591 un
->setNode(0, ln
.release());
592 un
->setNode(1, rn
->releaseNode(0));
593 rn
->setNode(0, un
.release());
598 un
->setNode(0, ln
.release());
599 un
->setNode(1, rn
.release());
605 wxPluralFormsNode
* wxPluralFormsParser::logicalAndExpression()
607 wxPluralFormsNode
* p
= equalityExpression();
610 wxPluralFormsNodePtr
ln(p
); // left
611 if (token().type() == wxPluralFormsToken::T_LOGICAL_AND
)
613 wxPluralFormsNodePtr
un(new wxPluralFormsNode(token())); // up
618 p
= logicalAndExpression();
623 wxPluralFormsNodePtr
rn(p
); // right
624 if (rn
->token().type() == wxPluralFormsToken::T_LOGICAL_AND
)
626 // transform 1 && (2 && 3) -> (1 && 2) && 3
630 un
->setNode(0, ln
.release());
631 un
->setNode(1, rn
->releaseNode(0));
632 rn
->setNode(0, un
.release());
636 un
->setNode(0, ln
.release());
637 un
->setNode(1, rn
.release());
643 wxPluralFormsNode
* wxPluralFormsParser::equalityExpression()
645 wxPluralFormsNode
* p
= relationalExpression();
648 wxPluralFormsNodePtr
n(p
);
649 if (token().type() == wxPluralFormsToken::T_EQUAL
650 || token().type() == wxPluralFormsToken::T_NOT_EQUAL
)
652 wxPluralFormsNodePtr
qn(new wxPluralFormsNode(token()));
657 p
= relationalExpression();
663 qn
->setNode(0, n
.release());
669 wxPluralFormsNode
* wxPluralFormsParser::relationalExpression()
671 wxPluralFormsNode
* p
= multiplicativeExpression();
674 wxPluralFormsNodePtr
n(p
);
675 if (token().type() == wxPluralFormsToken::T_GREATER
676 || token().type() == wxPluralFormsToken::T_LESS
677 || token().type() == wxPluralFormsToken::T_GREATER_OR_EQUAL
678 || token().type() == wxPluralFormsToken::T_LESS_OR_EQUAL
)
680 wxPluralFormsNodePtr
qn(new wxPluralFormsNode(token()));
685 p
= multiplicativeExpression();
691 qn
->setNode(0, n
.release());
697 wxPluralFormsNode
* wxPluralFormsParser::multiplicativeExpression()
699 wxPluralFormsNode
* p
= pmExpression();
702 wxPluralFormsNodePtr
n(p
);
703 if (token().type() == wxPluralFormsToken::T_REMINDER
)
705 wxPluralFormsNodePtr
qn(new wxPluralFormsNode(token()));
716 qn
->setNode(0, n
.release());
722 wxPluralFormsNode
* wxPluralFormsParser::pmExpression()
724 wxPluralFormsNodePtr n
;
725 if (token().type() == wxPluralFormsToken::T_N
726 || token().type() == wxPluralFormsToken::T_NUMBER
)
728 n
.reset(new wxPluralFormsNode(token()));
734 else if (token().type() == wxPluralFormsToken::T_LEFT_BRACKET
) {
739 wxPluralFormsNode
* p
= expression();
745 if (token().type() != wxPluralFormsToken::T_RIGHT_BRACKET
)
761 wxPluralFormsCalculator
* wxPluralFormsCalculator::make(const char* s
)
763 wxPluralFormsCalculatorPtr
calculator(new wxPluralFormsCalculator
);
766 wxPluralFormsScanner
scanner(s
);
767 wxPluralFormsParser
p(scanner
);
768 if (!p
.parse(*calculator
))
773 return calculator
.release();
779 // ----------------------------------------------------------------------------
780 // wxMsgCatalogFile corresponds to one disk-file message catalog.
782 // This is a "low-level" class and is used only by wxMsgCatalog
783 // NOTE: for the documentation of the binary catalog (.MO) files refer to
784 // the GNU gettext manual:
785 // http://www.gnu.org/software/autoconf/manual/gettext/MO-Files.html
786 // ----------------------------------------------------------------------------
788 WX_DECLARE_EXPORTED_STRING_HASH_MAP(wxString
, wxMessagesHash
);
790 class wxMsgCatalogFile
793 typedef wxScopedCharTypeBuffer
<char> DataBuffer
;
799 // load the catalog from disk
800 bool LoadFile(const wxString
& filename
,
801 wxPluralFormsCalculatorPtr
& rPluralFormsCalculator
);
802 bool LoadData(const DataBuffer
& data
,
803 wxPluralFormsCalculatorPtr
& rPluralFormsCalculator
);
805 // fills the hash with string-translation pairs
806 bool FillHash(wxMessagesHash
& hash
, const wxString
& msgIdCharset
) const;
808 // return the charset of the strings in this catalog or empty string if
810 wxString
GetCharset() const { return m_charset
; }
813 // this implementation is binary compatible with GNU gettext() version 0.10
815 // an entry in the string table
816 struct wxMsgTableEntry
818 size_t32 nLen
; // length of the string
819 size_t32 ofsString
; // pointer to the string
822 // header of a .mo file
823 struct wxMsgCatalogHeader
825 size_t32 magic
, // offset +00: magic id
826 revision
, // +04: revision
827 numStrings
; // +08: number of strings in the file
828 size_t32 ofsOrigTable
, // +0C: start of original string table
829 ofsTransTable
; // +10: start of translated string table
830 size_t32 nHashSize
, // +14: hash table size
831 ofsHashTable
; // +18: offset of hash table start
834 // all data is stored here
838 size_t32 m_numStrings
; // number of strings in this domain
839 wxMsgTableEntry
*m_pOrigTable
, // pointer to original strings
840 *m_pTransTable
; // translated
842 wxString m_charset
; // from the message catalog header
845 // swap the 2 halves of 32 bit integer if needed
846 size_t32
Swap(size_t32 ui
) const
848 return m_bSwapped
? (ui
<< 24) | ((ui
& 0xff00) << 8) |
849 ((ui
>> 8) & 0xff00) | (ui
>> 24)
853 const char *StringAtOfs(wxMsgTableEntry
*pTable
, size_t32 n
) const
855 const wxMsgTableEntry
* const ent
= pTable
+ n
;
857 // this check could fail for a corrupt message catalog
858 size_t32 ofsString
= Swap(ent
->ofsString
);
859 if ( ofsString
+ Swap(ent
->nLen
) > m_data
.length())
864 return m_data
.data() + ofsString
;
867 bool m_bSwapped
; // wrong endianness?
869 wxDECLARE_NO_COPY_CLASS(wxMsgCatalogFile
);
873 // ----------------------------------------------------------------------------
874 // wxMsgCatalog corresponds to one loaded message catalog.
876 // This is a "low-level" class and is used only by wxLocale (that's why
877 // it's designed to be stored in a linked list)
878 // ----------------------------------------------------------------------------
884 wxMsgCatalog() { m_conv
= NULL
; }
888 // load the catalog from disk
889 bool LoadFile(const wxString
& filename
,
890 const wxString
& domain
,
891 const wxString
& msgIdCharset
);
893 bool LoadData(const wxScopedCharTypeBuffer
<char>& data
,
894 const wxString
& domain
,
895 const wxString
& msgIdCharset
);
897 // get name of the catalog
898 wxString
GetDomain() const { return m_domain
; }
900 // get the translated string: returns NULL if not found
901 const wxString
*GetString(const wxString
& sz
, unsigned n
= UINT_MAX
) const;
903 // public variable pointing to the next element in a linked list (or NULL)
904 wxMsgCatalog
*m_pNext
;
907 wxMessagesHash m_messages
; // all messages in the catalog
908 wxString m_domain
; // name of the domain
911 // the conversion corresponding to this catalog charset if we installed it
916 wxPluralFormsCalculatorPtr m_pluralFormsCalculator
;
919 // ----------------------------------------------------------------------------
920 // wxMsgCatalogFile clas
921 // ----------------------------------------------------------------------------
923 wxMsgCatalogFile::wxMsgCatalogFile()
927 wxMsgCatalogFile::~wxMsgCatalogFile()
931 // open disk file and read in it's contents
932 bool wxMsgCatalogFile::LoadFile(const wxString
& filename
,
933 wxPluralFormsCalculatorPtr
& rPluralFormsCalculator
)
935 wxFile
fileMsg(filename
);
936 if ( !fileMsg
.IsOpened() )
939 // get the file size (assume it is less than 4Gb...)
940 wxFileOffset lenFile
= fileMsg
.Length();
941 if ( lenFile
== wxInvalidOffset
)
944 size_t nSize
= wx_truncate_cast(size_t, lenFile
);
945 wxASSERT_MSG( nSize
== lenFile
+ size_t(0), wxS("message catalog bigger than 4GB?") );
947 wxMemoryBuffer filedata
;
949 // read the whole file in memory
950 if ( fileMsg
.Read(filedata
.GetWriteBuf(nSize
), nSize
) != lenFile
)
953 filedata
.UngetWriteBuf(nSize
);
957 DataBuffer::CreateOwned((char*)filedata
.release(), nSize
),
958 rPluralFormsCalculator
962 wxLogWarning(_("'%s' is not a valid message catalog."), filename
.c_str());
970 bool wxMsgCatalogFile::LoadData(const DataBuffer
& data
,
971 wxPluralFormsCalculatorPtr
& rPluralFormsCalculator
)
974 bool bValid
= data
.length() > sizeof(wxMsgCatalogHeader
);
976 const wxMsgCatalogHeader
*pHeader
= (wxMsgCatalogHeader
*)data
.data();
978 // we'll have to swap all the integers if it's true
979 m_bSwapped
= pHeader
->magic
== MSGCATALOG_MAGIC_SW
;
981 // check the magic number
982 bValid
= m_bSwapped
|| pHeader
->magic
== MSGCATALOG_MAGIC
;
986 // it's either too short or has incorrect magic number
987 wxLogWarning(_("Invalid message catalog."));
994 m_numStrings
= Swap(pHeader
->numStrings
);
995 m_pOrigTable
= (wxMsgTableEntry
*)(data
.data() +
996 Swap(pHeader
->ofsOrigTable
));
997 m_pTransTable
= (wxMsgTableEntry
*)(data
.data() +
998 Swap(pHeader
->ofsTransTable
));
1000 // now parse catalog's header and try to extract catalog charset and
1001 // plural forms formula from it:
1003 const char* headerData
= StringAtOfs(m_pOrigTable
, 0);
1004 if ( headerData
&& headerData
[0] == '\0' )
1006 // Extract the charset:
1007 const char * const header
= StringAtOfs(m_pTransTable
, 0);
1009 cset
= strstr(header
, "Content-Type: text/plain; charset=");
1012 cset
+= 34; // strlen("Content-Type: text/plain; charset=")
1014 const char * const csetEnd
= strchr(cset
, '\n');
1017 m_charset
= wxString(cset
, csetEnd
- cset
);
1018 if ( m_charset
== wxS("CHARSET") )
1020 // "CHARSET" is not valid charset, but lazy translator
1025 // else: incorrectly filled Content-Type header
1027 // Extract plural forms:
1028 const char * plurals
= strstr(header
, "Plural-Forms:");
1031 plurals
+= 13; // strlen("Plural-Forms:")
1032 const char * const pluralsEnd
= strchr(plurals
, '\n');
1035 const size_t pluralsLen
= pluralsEnd
- plurals
;
1036 wxCharBuffer
buf(pluralsLen
);
1037 strncpy(buf
.data(), plurals
, pluralsLen
);
1038 wxPluralFormsCalculator
* const
1039 pCalculator
= wxPluralFormsCalculator::make(buf
);
1042 rPluralFormsCalculator
.reset(pCalculator
);
1046 wxLogVerbose(_("Failed to parse Plural-Forms: '%s'"),
1052 if ( !rPluralFormsCalculator
.get() )
1053 rPluralFormsCalculator
.reset(wxPluralFormsCalculator::make());
1056 // everything is fine
1060 bool wxMsgCatalogFile::FillHash(wxMessagesHash
& hash
,
1061 const wxString
& msgIdCharset
) const
1063 wxUnusedVar(msgIdCharset
); // silence warning in Unicode build
1065 // conversion to use to convert catalog strings to the GUI encoding
1066 wxMBConv
*inputConv
= NULL
;
1067 wxMBConv
*inputConvPtr
= NULL
; // same as inputConv but safely deleteable
1069 if ( !m_charset
.empty() )
1071 #if !wxUSE_UNICODE && wxUSE_FONTMAP
1072 // determine if we need any conversion at all
1073 wxFontEncoding encCat
= wxFontMapperBase::GetEncodingFromName(m_charset
);
1074 if ( encCat
!= wxLocale::GetSystemEncoding() )
1078 inputConv
= new wxCSConv(m_charset
);
1081 else // no need or not possible to convert the encoding
1084 // we must somehow convert the narrow strings in the message catalog to
1085 // wide strings, so use the default conversion if we have no charset
1086 inputConv
= wxConvCurrent
;
1091 // conversion to apply to msgid strings before looking them up: we only
1092 // need it if the msgids are neither in 7 bit ASCII nor in the same
1093 // encoding as the catalog
1094 wxCSConv
*sourceConv
= msgIdCharset
.empty() || (msgIdCharset
== m_charset
)
1096 : new wxCSConv(msgIdCharset
);
1097 #endif // !wxUSE_UNICODE
1099 for (size_t32 i
= 0; i
< m_numStrings
; i
++)
1101 const char *data
= StringAtOfs(m_pOrigTable
, i
);
1103 return false; // may happen for invalid MO files
1107 msgid
= wxString(data
, *inputConv
);
1109 if ( inputConv
&& sourceConv
)
1110 msgid
= wxString(inputConv
->cMB2WC(data
), *sourceConv
);
1113 #endif // wxUSE_UNICODE
1115 data
= StringAtOfs(m_pTransTable
, i
);
1117 return false; // may happen for invalid MO files
1119 size_t length
= Swap(m_pTransTable
[i
].nLen
);
1122 while (offset
< length
)
1124 const char * const str
= data
+ offset
;
1128 msgstr
= wxString(str
, *inputConv
);
1131 msgstr
= wxString(inputConv
->cMB2WC(str
), *wxConvUI
);
1134 #endif // wxUSE_UNICODE/!wxUSE_UNICODE
1136 if ( !msgstr
.empty() )
1138 hash
[index
== 0 ? msgid
: msgid
+ wxChar(index
)] = msgstr
;
1142 // IMPORTANT: accesses to the 'data' pointer are valid only for
1143 // the first 'length+1' bytes (GNU specs says that the
1144 // final NUL is not counted in length); using wxStrnlen()
1145 // we make sure we don't access memory beyond the valid range
1146 // (which otherwise may happen for invalid MO files):
1147 offset
+= wxStrnlen(str
, length
- offset
) + 1;
1155 delete inputConvPtr
;
1161 // ----------------------------------------------------------------------------
1162 // wxMsgCatalog class
1163 // ----------------------------------------------------------------------------
1166 wxMsgCatalog::~wxMsgCatalog()
1170 if ( wxConvUI
== m_conv
)
1172 // we only change wxConvUI if it points to wxConvLocal so we reset
1173 // it back to it too
1174 wxConvUI
= &wxConvLocal
;
1180 #endif // !wxUSE_UNICODE
1182 bool wxMsgCatalog::LoadFile(const wxString
& filename
,
1183 const wxString
& domain
,
1184 const wxString
& msgIdCharset
)
1186 wxMsgCatalogFile file
;
1190 if ( !file
.LoadFile(filename
, m_pluralFormsCalculator
) )
1193 if ( !file
.FillHash(m_messages
, msgIdCharset
) )
1199 bool wxMsgCatalog::LoadData(const wxScopedCharTypeBuffer
<char>& data
,
1200 const wxString
& domain
,
1201 const wxString
& msgIdCharset
)
1203 wxMsgCatalogFile file
;
1207 if ( !file
.LoadData(data
, m_pluralFormsCalculator
) )
1210 if ( !file
.FillHash(m_messages
, msgIdCharset
) )
1216 const wxString
*wxMsgCatalog::GetString(const wxString
& str
, unsigned n
) const
1221 index
= m_pluralFormsCalculator
->evaluate(n
);
1223 wxMessagesHash::const_iterator i
;
1226 i
= m_messages
.find(wxString(str
) + wxChar(index
)); // plural
1230 i
= m_messages
.find(str
);
1233 if ( i
!= m_messages
.end() )
1242 // ----------------------------------------------------------------------------
1244 // ----------------------------------------------------------------------------
1249 wxTranslations
*gs_translations
= NULL
;
1250 bool gs_translationsOwned
= false;
1252 } // anonymous namespace
1256 wxTranslations
*wxTranslations::Get()
1258 return gs_translations
;
1262 void wxTranslations::Set(wxTranslations
*t
)
1264 if ( gs_translationsOwned
)
1265 delete gs_translations
;
1266 gs_translations
= t
;
1267 gs_translationsOwned
= true;
1271 void wxTranslations::SetNonOwned(wxTranslations
*t
)
1273 if ( gs_translationsOwned
)
1274 delete gs_translations
;
1275 gs_translations
= t
;
1276 gs_translationsOwned
= false;
1280 wxTranslations::wxTranslations()
1283 m_loader
= new wxFileTranslationsLoader
;
1287 wxTranslations::~wxTranslations()
1291 // free catalogs memory
1292 wxMsgCatalog
*pTmpCat
;
1293 while ( m_pMsgCat
!= NULL
)
1295 pTmpCat
= m_pMsgCat
;
1296 m_pMsgCat
= m_pMsgCat
->m_pNext
;
1302 void wxTranslations::SetLoader(wxTranslationsLoader
*loader
)
1304 wxCHECK_RET( loader
, "loader can't be NULL" );
1311 void wxTranslations::SetLanguage(wxLanguage lang
)
1313 if ( lang
== wxLANGUAGE_DEFAULT
)
1316 SetLanguage(wxLocale::GetLanguageCanonicalName(lang
));
1319 void wxTranslations::SetLanguage(const wxString
& lang
)
1325 bool wxTranslations::AddStdCatalog()
1327 if ( !AddCatalog(wxS("wxstd")) )
1330 // there may be a catalog with toolkit specific overrides, it is not
1331 // an error if this does not exist
1332 wxString
port(wxPlatformInfo::Get().GetPortIdName());
1333 if ( !port
.empty() )
1335 AddCatalog(port
.BeforeFirst(wxS('/')).MakeLower());
1342 bool wxTranslations::AddCatalog(const wxString
& domain
)
1344 return AddCatalog(domain
, wxLANGUAGE_ENGLISH_US
);
1348 bool wxTranslations::AddCatalog(const wxString
& domain
,
1349 wxLanguage msgIdLanguage
,
1350 const wxString
& msgIdCharset
)
1352 m_msgIdCharset
[domain
] = msgIdCharset
;
1353 return AddCatalog(domain
, msgIdLanguage
);
1355 #endif // !wxUSE_UNICODE
1357 bool wxTranslations::AddCatalog(const wxString
& domain
,
1358 wxLanguage msgIdLanguage
)
1360 const wxString msgIdLang
= wxLocale::GetLanguageCanonicalName(msgIdLanguage
);
1361 const wxString domain_lang
= ChooseLanguageForDomain(domain
, msgIdLang
);
1363 if ( domain_lang
.empty() )
1365 wxLogTrace(TRACE_I18N
,
1366 wxS("no suitable translation for domain '%s' found"),
1371 wxLogTrace(TRACE_I18N
,
1372 wxS("adding '%s' translation for domain '%s' (msgid language '%s')"),
1373 domain_lang
, domain
, msgIdLang
);
1375 // It is OK to not load catalog if the msgid language and m_language match,
1376 // in which case we can directly display the texts embedded in program's
1378 if ( msgIdLang
== domain_lang
)
1381 return LoadCatalog(domain
, domain_lang
);
1385 bool wxTranslations::LoadCatalog(const wxString
& domain
, const wxString
& lang
)
1387 wxCHECK_MSG( m_loader
, false, "loader can't be NULL" );
1390 // first look for the catalog for this language and the current locale:
1391 // notice that we don't use the system name for the locale as this would
1392 // force us to install catalogs in different locations depending on the
1393 // system but always use the canonical name
1394 wxFontEncoding encSys
= wxLocale::GetSystemEncoding();
1395 if ( encSys
!= wxFONTENCODING_SYSTEM
)
1397 wxString
fullname(lang
);
1398 fullname
<< wxS('.') << wxFontMapperBase::GetEncodingName(encSys
);
1400 if ( m_loader
->LoadCatalog(this, domain
, fullname
) )
1403 #endif // wxUSE_FONTMAP
1405 // Next try: use the provided name language name:
1406 if ( m_loader
->LoadCatalog(this, domain
, lang
) )
1409 // Also try just base locale name: for things like "fr_BE" (Belgium
1410 // French) we should use fall back on plain "fr" if no Belgium-specific
1411 // message catalogs exist
1412 wxString baselang
= lang
.BeforeFirst('_');
1413 if ( lang
!= baselang
)
1415 if ( m_loader
->LoadCatalog(this, domain
, baselang
) )
1419 // Nothing worked, the catalog just isn't there
1420 wxLogTrace(TRACE_I18N
,
1421 "Catalog \"%s.mo\" not found for language \"%s\".",
1427 // check if the given catalog is loaded
1428 bool wxTranslations::IsLoaded(const wxString
& domain
) const
1430 return FindCatalog(domain
) != NULL
;
1434 bool wxTranslations::LoadCatalogFile(const wxString
& filename
,
1435 const wxString
& domain
)
1437 wxMsgCatalog
*pMsgCat
= new wxMsgCatalog
;
1440 const bool ok
= pMsgCat
->LoadFile(filename
, domain
, wxEmptyString
/*unused*/);
1442 const bool ok
= pMsgCat
->LoadFile(filename
, domain
,
1443 m_msgIdCharset
[domain
]);
1448 // don't add it because it couldn't be loaded anyway
1453 // add it to the head of the list so that in GetString it will
1454 // be searched before the catalogs added earlier
1455 pMsgCat
->m_pNext
= m_pMsgCat
;
1456 m_pMsgCat
= pMsgCat
;
1462 bool wxTranslations::LoadCatalogData(const wxScopedCharTypeBuffer
<char>& data
,
1463 const wxString
& domain
)
1465 wxMsgCatalog
*pMsgCat
= new wxMsgCatalog
;
1468 const bool ok
= pMsgCat
->LoadData(data
, domain
, wxEmptyString
/*unused*/);
1470 const bool ok
= pMsgCat
->LoadData(data
, domain
,
1471 m_msgIdCharset
[domain
]);
1476 // don't add it because it couldn't be loaded anyway
1481 // add it to the head of the list so that in GetString it will
1482 // be searched before the catalogs added earlier
1483 pMsgCat
->m_pNext
= m_pMsgCat
;
1484 m_pMsgCat
= pMsgCat
;
1490 wxString
wxTranslations::ChooseLanguageForDomain(const wxString
& WXUNUSED(domain
),
1491 const wxString
& WXUNUSED(msgIdLang
))
1493 // explicitly set language should always be respected
1494 if ( !m_lang
.empty() )
1497 // TODO: if the default language is used, pick the best (by comparing
1498 // available languages with user's preferences), instead of blindly
1499 // trusting availability of system language translation
1500 return wxLocale::GetLanguageCanonicalName(wxLocale::GetSystemLanguage());
1506 WX_DECLARE_HASH_SET(wxString
, wxStringHash
, wxStringEqual
,
1507 wxLocaleUntranslatedStrings
);
1511 const wxString
& wxTranslations::GetUntranslatedString(const wxString
& str
)
1513 static wxLocaleUntranslatedStrings s_strings
;
1515 wxLocaleUntranslatedStrings::iterator i
= s_strings
.find(str
);
1516 if ( i
== s_strings
.end() )
1517 return *s_strings
.insert(str
).first
;
1523 const wxString
& wxTranslations::GetString(const wxString
& origString
,
1524 const wxString
& domain
) const
1526 return GetString(origString
, origString
, UINT_MAX
, domain
);
1529 const wxString
& wxTranslations::GetString(const wxString
& origString
,
1530 const wxString
& origString2
,
1532 const wxString
& domain
) const
1534 if ( origString
.empty() )
1535 return GetUntranslatedString(origString
);
1537 const wxString
*trans
= NULL
;
1538 wxMsgCatalog
*pMsgCat
;
1540 if ( !domain
.empty() )
1542 pMsgCat
= FindCatalog(domain
);
1544 // does the catalog exist?
1545 if ( pMsgCat
!= NULL
)
1546 trans
= pMsgCat
->GetString(origString
, n
);
1550 // search in all domains
1551 for ( pMsgCat
= m_pMsgCat
; pMsgCat
!= NULL
; pMsgCat
= pMsgCat
->m_pNext
)
1553 trans
= pMsgCat
->GetString(origString
, n
);
1554 if ( trans
!= NULL
) // take the first found
1559 if ( trans
== NULL
)
1564 "string \"%s\"%s not found in %slocale '%s'.",
1566 ((long)n
) != -1 ? wxString::Format("[%ld]", (long)n
) : wxString(),
1567 !domain
.empty() ? wxString::Format("domain '%s' ", domain
) : wxString(),
1572 return GetUntranslatedString(origString
);
1574 return GetUntranslatedString(n
== 1 ? origString
: origString2
);
1581 wxString
wxTranslations::GetHeaderValue(const wxString
& header
,
1582 const wxString
& domain
) const
1584 if ( header
.empty() )
1585 return wxEmptyString
;
1587 const wxString
*trans
= NULL
;
1588 wxMsgCatalog
*pMsgCat
;
1590 if ( !domain
.empty() )
1592 pMsgCat
= FindCatalog(domain
);
1594 // does the catalog exist?
1595 if ( pMsgCat
== NULL
)
1596 return wxEmptyString
;
1598 trans
= pMsgCat
->GetString(wxEmptyString
, UINT_MAX
);
1602 // search in all domains
1603 for ( pMsgCat
= m_pMsgCat
; pMsgCat
!= NULL
; pMsgCat
= pMsgCat
->m_pNext
)
1605 trans
= pMsgCat
->GetString(wxEmptyString
, UINT_MAX
);
1606 if ( trans
!= NULL
) // take the first found
1611 if ( !trans
|| trans
->empty() )
1612 return wxEmptyString
;
1614 size_t found
= trans
->find(header
);
1615 if ( found
== wxString::npos
)
1616 return wxEmptyString
;
1618 found
+= header
.length() + 2 /* ': ' */;
1620 // Every header is separated by \n
1622 size_t endLine
= trans
->find(wxS('\n'), found
);
1623 size_t len
= (endLine
== wxString::npos
) ?
1624 wxString::npos
: (endLine
- found
);
1626 return trans
->substr(found
, len
);
1630 // find catalog by name in a linked list, return NULL if !found
1631 wxMsgCatalog
*wxTranslations::FindCatalog(const wxString
& domain
) const
1633 // linear search in the linked list
1634 wxMsgCatalog
*pMsgCat
;
1635 for ( pMsgCat
= m_pMsgCat
; pMsgCat
!= NULL
; pMsgCat
= pMsgCat
->m_pNext
)
1637 if ( pMsgCat
->GetDomain() == domain
)
1644 // ----------------------------------------------------------------------------
1645 // wxFileTranslationsLoader
1646 // ----------------------------------------------------------------------------
1651 // the list of the directories to search for message catalog files
1652 wxArrayString gs_searchPrefixes
;
1654 // return the directories to search for message catalogs under the given
1655 // prefix, separated by wxPATH_SEP
1656 wxString
GetMsgCatalogSubdirs(const wxString
& prefix
, const wxString
& lang
)
1658 // Search first in Unix-standard prefix/lang/LC_MESSAGES, then in
1659 // prefix/lang and finally in just prefix.
1661 // Note that we use LC_MESSAGES on all platforms and not just Unix, because
1662 // it doesn't cost much to look into one more directory and doing it this
1663 // way has two important benefits:
1664 // a) we don't break compatibility with wx-2.6 and older by stopping to
1665 // look in a directory where the catalogs used to be and thus silently
1666 // breaking apps after they are recompiled against the latest wx
1667 // b) it makes it possible to package app's support files in the same
1668 // way on all target platforms
1669 const wxString pathPrefix
= wxFileName(prefix
, lang
).GetFullPath();
1671 wxString searchPath
;
1672 searchPath
.reserve(4*pathPrefix
.length());
1673 searchPath
<< pathPrefix
<< wxFILE_SEP_PATH
<< "LC_MESSAGES" << wxPATH_SEP
1674 << prefix
<< wxFILE_SEP_PATH
<< wxPATH_SEP
1680 // construct the search path for the given language
1681 static wxString
GetFullSearchPath(const wxString
& lang
)
1683 // first take the entries explicitly added by the program
1684 wxArrayString paths
;
1685 paths
.reserve(gs_searchPrefixes
.size() + 1);
1687 count
= gs_searchPrefixes
.size();
1688 for ( n
= 0; n
< count
; n
++ )
1690 paths
.Add(GetMsgCatalogSubdirs(gs_searchPrefixes
[n
], lang
));
1695 // then look in the standard location
1696 const wxString stdp
= wxStandardPaths::Get().
1697 GetLocalizedResourcesDir(lang
, wxStandardPaths::ResourceCat_Messages
);
1699 if ( paths
.Index(stdp
) == wxNOT_FOUND
)
1701 #endif // wxUSE_STDPATHS
1703 // last look in default locations
1705 // LC_PATH is a standard env var containing the search path for the .mo
1707 const char *pszLcPath
= wxGetenv("LC_PATH");
1710 const wxString lcp
= GetMsgCatalogSubdirs(pszLcPath
, lang
);
1711 if ( paths
.Index(lcp
) == wxNOT_FOUND
)
1715 // also add the one from where wxWin was installed:
1716 wxString wxp
= wxGetInstallPrefix();
1719 wxp
= GetMsgCatalogSubdirs(wxp
+ wxS("/share/locale"), lang
);
1720 if ( paths
.Index(wxp
) == wxNOT_FOUND
)
1726 // finally construct the full search path
1727 wxString searchPath
;
1728 searchPath
.reserve(500);
1729 count
= paths
.size();
1730 for ( n
= 0; n
< count
; n
++ )
1732 searchPath
+= paths
[n
];
1733 if ( n
!= count
- 1 )
1734 searchPath
+= wxPATH_SEP
;
1740 } // anonymous namespace
1743 void wxFileTranslationsLoader::AddCatalogLookupPathPrefix(const wxString
& prefix
)
1745 if ( gs_searchPrefixes
.Index(prefix
) == wxNOT_FOUND
)
1747 gs_searchPrefixes
.Add(prefix
);
1749 //else: already have it
1753 bool wxFileTranslationsLoader::LoadCatalog(wxTranslations
*translations
,
1754 const wxString
& domain
,
1755 const wxString
& lang
)
1757 wxString searchPath
= GetFullSearchPath(lang
);
1759 wxLogTrace(TRACE_I18N
, wxS("Looking for \"%s.mo\" in search path \"%s\""),
1760 domain
, searchPath
);
1762 wxFileName
fn(domain
);
1763 fn
.SetExt(wxS("mo"));
1765 wxString strFullName
;
1766 if ( !wxFindFileInPath(&strFullName
, searchPath
, fn
.GetFullPath()) )
1769 // open file and read its data
1770 wxLogVerbose(_("using catalog '%s' from '%s'."), domain
, strFullName
.c_str());
1771 wxLogTrace(TRACE_I18N
, wxS("Using catalog \"%s\"."), strFullName
.c_str());
1773 return translations
->LoadCatalogFile(strFullName
, domain
);
1777 // ----------------------------------------------------------------------------
1778 // wxResourceTranslationsLoader
1779 // ----------------------------------------------------------------------------
1782 bool wxResourceTranslationsLoader::LoadCatalog(wxTranslations
*translations
,
1783 const wxString
& domain
,
1784 const wxString
& lang
)
1787 const void *mo_data
= NULL
;
1790 const wxString resname
= wxString::Format("%s_%s", domain
, lang
);
1792 if ( !wxLoadUserResource(&mo_data
, &mo_size
,
1798 wxLogTrace(TRACE_I18N
,
1799 "Using catalog from Windows resource \"%s\".", resname
);
1801 const bool ok
= translations
->LoadCatalogData(
1802 wxCharBuffer::CreateNonOwned(static_cast<const char*>(mo_data
), mo_size
));
1804 wxLogWarning(_("Resource '%s' is not a valid message catalog."), resname
);
1808 #endif // __WINDOWS__
1811 // ----------------------------------------------------------------------------
1812 // wxTranslationsModule module (for destruction of gs_translations)
1813 // ----------------------------------------------------------------------------
1815 class wxTranslationsModule
: public wxModule
1817 DECLARE_DYNAMIC_CLASS(wxTranslationsModule
)
1819 wxTranslationsModule() {}
1828 if ( gs_translationsOwned
)
1829 delete gs_translations
;
1830 gs_translations
= NULL
;
1831 gs_translationsOwned
= true;
1835 IMPLEMENT_DYNAMIC_CLASS(wxTranslationsModule
, wxModule
)
1837 #endif // wxUSE_INTL