]> git.saurik.com Git - wxWidgets.git/blame_incremental - src/common/intl.cpp
just some comments
[wxWidgets.git] / src / common / intl.cpp
... / ...
CommitLineData
1/////////////////////////////////////////////////////////////////////////////
2// Name: intl.cpp
3// Purpose: Internationalization and localisation for wxWindows
4// Author: Vadim Zeitlin
5// Modified by:
6// Created: 29/01/98
7// RCS-ID: $Id$
8// Copyright: (c) 1998 Vadim Zeitlin <zeitlin@dptmaths.ens-cachan.fr>
9// Licence: wxWindows license
10/////////////////////////////////////////////////////////////////////////////
11
12// ============================================================================
13// declaration
14// ============================================================================
15
16// ----------------------------------------------------------------------------
17// headers
18// ----------------------------------------------------------------------------
19
20#ifdef __GNUG__
21 #pragma implementation "intl.h"
22#endif
23
24// For compilers that support precompilation, includes "wx.h".
25#include "wx/wxprec.h"
26
27#ifdef __BORLANDC__
28 #pragma hdrstop
29#endif
30
31#if wxUSE_INTL
32
33// standard headers
34#include <locale.h>
35#include <ctype.h>
36
37// wxWindows
38#include "wx/defs.h"
39#include "wx/string.h"
40#include "wx/intl.h"
41#include "wx/file.h"
42#include "wx/log.h"
43#include "wx/debug.h"
44#include "wx/utils.h"
45
46#include <stdlib.h>
47
48// ----------------------------------------------------------------------------
49// simple types
50// ----------------------------------------------------------------------------
51
52// this should *not* be wxChar, this type must have exactly 8 bits!
53typedef unsigned char size_t8;
54
55#ifdef __WXMSW__
56 #if defined(__WIN16__)
57 typedef unsigned long size_t32;
58 #elif defined(__WIN32__)
59 typedef unsigned int size_t32;
60 #else
61 // Win64 will have different type sizes
62 #error "Please define a 32 bit type"
63 #endif
64#else // !Windows
65 // SIZEOF_XXX are defined by configure
66 #if defined(SIZEOF_INT) && (SIZEOF_INT == 4)
67 typedef unsigned int size_t32;
68 #elif defined(SIZEOF_LONG) && (SIZEOF_LONG == 4)
69 typedef unsigned long size_t32;
70 #else
71 // assume sizeof(int) == 4 - what else can we do
72 typedef unsigned int size_t32;
73
74 // ... but at least check it during run time
75 static class IntSizeChecker
76 {
77 public:
78 IntSizeChecker()
79 {
80 // Asserting a sizeof directly causes some compilers to
81 // issue a "using constant in a conditional expression" warning
82 size_t intsize = sizeof(int);
83
84 wxASSERT_MSG( intsize == 4,
85 "size_t32 is incorrectly defined!" );
86 }
87 } intsizechecker;
88 #endif
89#endif // Win/!Win
90
91// ----------------------------------------------------------------------------
92// constants
93// ----------------------------------------------------------------------------
94
95// magic number identifying the .mo format file
96const size_t32 MSGCATALOG_MAGIC = 0x950412de;
97const size_t32 MSGCATALOG_MAGIC_SW = 0xde120495;
98
99// extension of ".mo" files
100#define MSGCATALOG_EXTENSION ".mo"
101
102// ----------------------------------------------------------------------------
103// global functions
104// ----------------------------------------------------------------------------
105
106// suppress further error messages about missing translations
107// (if you don't have one catalog file, you wouldn't like to see the
108// error message for each string in it, so normally it's given only
109// once)
110void wxSuppressTransErrors();
111
112// restore the logging
113void wxRestoreTransErrors();
114
115// get the current state
116bool wxIsLoggingTransErrors();
117
118static wxLocale *wxSetLocale(wxLocale *pLocale);
119
120// ----------------------------------------------------------------------------
121// wxMsgCatalog corresponds to one disk-file message catalog.
122//
123// This is a "low-level" class and is used only by wxLocale (that's why
124// it's designed to be stored in a linked list)
125// ----------------------------------------------------------------------------
126
127class wxMsgCatalog
128{
129public:
130 // ctor & dtor
131 wxMsgCatalog();
132 ~wxMsgCatalog();
133
134 // load the catalog from disk (szDirPrefix corresponds to language)
135 bool Load(const wxChar *szDirPrefix, const wxChar *szName, bool bConvertEncoding = FALSE);
136 bool IsLoaded() const { return m_pData != NULL; }
137
138 // get name of the catalog
139 const wxChar *GetName() const { return m_pszName; }
140
141 // get the translated string: returns NULL if not found
142 const char *GetString(const char *sz) const;
143
144 // public variable pointing to the next element in a linked list (or NULL)
145 wxMsgCatalog *m_pNext;
146
147private:
148 // this implementation is binary compatible with GNU gettext() version 0.10
149
150 // an entry in the string table
151 struct wxMsgTableEntry
152 {
153 size_t32 nLen; // length of the string
154 size_t32 ofsString; // pointer to the string
155 };
156
157 // header of a .mo file
158 struct wxMsgCatalogHeader
159 {
160 size_t32 magic, // offset +00: magic id
161 revision, // +04: revision
162 numStrings; // +08: number of strings in the file
163 size_t32 ofsOrigTable, // +0C: start of original string table
164 ofsTransTable; // +10: start of translated string table
165 size_t32 nHashSize, // +14: hash table size
166 ofsHashTable; // +18: offset of hash table start
167 };
168
169 // all data is stored here, NULL if no data loaded
170 size_t8 *m_pData;
171
172 // data description
173 size_t32 m_numStrings, // number of strings in this domain
174 m_nHashSize; // number of entries in hash table
175 size_t32 *m_pHashTable; // pointer to hash table
176 wxMsgTableEntry *m_pOrigTable, // pointer to original strings
177 *m_pTransTable; // translated
178
179 const char *StringAtOfs(wxMsgTableEntry *pTable, size_t32 index) const
180 { return (const char *)(m_pData + Swap(pTable[index].ofsString)); }
181
182 // convert encoding to platform native one, if neccessary
183 void ConvertEncoding();
184
185 // utility functions
186 // calculate the hash value of given string
187 static inline size_t32 GetHash(const char *sz);
188 // big<->little endian
189 inline size_t32 Swap(size_t32 ui) const;
190
191 // internal state
192 bool HasHashTable() const // true if hash table is present
193 { return m_nHashSize > 2 && m_pHashTable != NULL; }
194
195 bool m_bSwapped; // wrong endianness?
196
197 wxChar *m_pszName; // name of the domain
198};
199
200// ----------------------------------------------------------------------------
201// global variables
202// ----------------------------------------------------------------------------
203
204// the list of the directories to search for message catalog files
205static wxArrayString s_searchPrefixes;
206
207// ============================================================================
208// implementation
209// ============================================================================
210
211// ----------------------------------------------------------------------------
212// wxMsgCatalog class
213// ----------------------------------------------------------------------------
214
215// calculate hash value using the so called hashpjw function by P.J. Weinberger
216// [see Aho/Sethi/Ullman, COMPILERS: Principles, Techniques and Tools]
217size_t32 wxMsgCatalog::GetHash(const char *sz)
218{
219 #define HASHWORDBITS 32 // the length of size_t32
220
221 size_t32 hval = 0;
222 size_t32 g;
223 while ( *sz != '\0' ) {
224 hval <<= 4;
225 hval += (size_t32)*sz++;
226 g = hval & ((size_t32)0xf << (HASHWORDBITS - 4));
227 if ( g != 0 ) {
228 hval ^= g >> (HASHWORDBITS - 8);
229 hval ^= g;
230 }
231 }
232
233 return hval;
234}
235
236// swap the 2 halves of 32 bit integer if needed
237size_t32 wxMsgCatalog::Swap(size_t32 ui) const
238{
239 return m_bSwapped ? (ui << 24) | ((ui & 0xff00) << 8) |
240 ((ui >> 8) & 0xff00) | (ui >> 24)
241 : ui;
242}
243
244wxMsgCatalog::wxMsgCatalog()
245{
246 m_pData = NULL;
247 m_pszName = NULL;
248}
249
250wxMsgCatalog::~wxMsgCatalog()
251{
252 wxDELETEA(m_pData);
253 wxDELETEA(m_pszName);
254}
255
256// small class to suppress the translation erros until exit from current scope
257class NoTransErr
258{
259public:
260 NoTransErr() { wxSuppressTransErrors(); }
261 ~NoTransErr() { wxRestoreTransErrors(); }
262};
263
264// return all directories to search for given prefix
265static wxString GetAllMsgCatalogSubdirs(const wxChar *prefix,
266 const wxChar *lang)
267{
268 wxString searchPath;
269
270 // search first in prefix/fr/LC_MESSAGES, then in prefix/fr and finally in
271 // prefix (assuming the language is 'fr')
272 searchPath << prefix << wxFILE_SEP_PATH << lang << wxFILE_SEP_PATH
273 << wxT("LC_MESSAGES") << wxPATH_SEP
274 << prefix << wxFILE_SEP_PATH << lang << wxPATH_SEP
275 << prefix << wxPATH_SEP;
276
277 return searchPath;
278}
279
280// construct the search path for the given language
281static wxString GetFullSearchPath(const wxChar *lang)
282{
283 wxString searchPath;
284
285 // first take the entries explicitly added by the program
286 size_t count = s_searchPrefixes.Count();
287 for ( size_t n = 0; n < count; n++ )
288 {
289 searchPath << GetAllMsgCatalogSubdirs(s_searchPrefixes[n], lang)
290 << wxPATH_SEP;
291 }
292
293 // then take the current directory
294 // FIXME it should be the directory of the executable
295 searchPath << GetAllMsgCatalogSubdirs(wxT("."), lang) << wxPATH_SEP;
296
297 // and finally add some standard ones
298 searchPath
299 << GetAllMsgCatalogSubdirs(wxT("/usr/share/locale"), lang) << wxPATH_SEP
300 << GetAllMsgCatalogSubdirs(wxT("/usr/lib/locale"), lang) << wxPATH_SEP
301 << GetAllMsgCatalogSubdirs(wxT("/usr/local/share/locale"), lang);
302
303 return searchPath;
304}
305
306// open disk file and read in it's contents
307bool wxMsgCatalog::Load(const wxChar *szDirPrefix, const wxChar *szName0, bool bConvertEncoding)
308{
309 /* We need to handle locales like de_AT.iso-8859-1
310 For this we first chop off the .CHARSET specifier and ignore it.
311 FIXME: UNICODE SUPPORT: must use CHARSET specifier!
312 */
313 wxString szName = szName0;
314 if(szName.Find(wxT('.')) != -1) // contains a dot
315 szName = szName.Left(szName.Find(wxT('.')));
316
317 // FIXME VZ: I forgot the exact meaning of LC_PATH - anyone to remind me?
318 // KB: search path where to find the mo files, probably : delimited
319#if 0
320 const wxChar *pszLcPath = wxGetenv("LC_PATH");
321 if ( pszLcPath != NULL )
322 strPath += pszLcPath + wxString(szDirPrefix) + MSG_PATH;
323#endif // 0
324
325 wxString searchPath = GetFullSearchPath(szDirPrefix);
326 const wxChar *sublocale = wxStrchr(szDirPrefix, wxT('_'));
327 if ( sublocale )
328 {
329 // also add just base locale name: for things like "fr_BE" (belgium
330 // french) we should use "fr" if no belgium specific message catalogs
331 // exist
332 searchPath << GetFullSearchPath(wxString(szDirPrefix).
333 Left((size_t)(sublocale - szDirPrefix)))
334 << wxPATH_SEP;
335 }
336
337 wxString strFile = szName;
338 strFile += MSGCATALOG_EXTENSION;
339
340 // don't give translation errors here because the wxstd catalog might
341 // not yet be loaded (and it's normal)
342 //
343 // (we're using an object because we have several return paths)
344
345 NoTransErr noTransErr;
346 wxLogVerbose(wxT("looking for catalog '%s' in path '%s'."),
347 szName.c_str(), searchPath.c_str());
348
349 wxString strFullName;
350 if ( !wxFindFileInPath(&strFullName, searchPath, strFile) ) {
351 wxLogWarning(_("catalog file for domain '%s' not found."), szName.c_str());
352 return FALSE;
353 }
354
355 // open file
356 wxLogVerbose(_("using catalog '%s' from '%s'."),
357 szName.c_str(), strFullName.c_str());
358
359 wxFile fileMsg(strFullName);
360 if ( !fileMsg.IsOpened() )
361 return FALSE;
362
363 // get the file size
364 off_t nSize = fileMsg.Length();
365 if ( nSize == wxInvalidOffset )
366 return FALSE;
367
368 // read the whole file in memory
369 m_pData = new size_t8[nSize];
370 if ( fileMsg.Read(m_pData, nSize) != nSize ) {
371 wxDELETEA(m_pData);
372 return FALSE;
373 }
374
375 // examine header
376 bool bValid = (size_t)nSize > sizeof(wxMsgCatalogHeader);
377
378 wxMsgCatalogHeader *pHeader = (wxMsgCatalogHeader *)m_pData;
379 if ( bValid ) {
380 // we'll have to swap all the integers if it's true
381 m_bSwapped = pHeader->magic == MSGCATALOG_MAGIC_SW;
382
383 // check the magic number
384 bValid = m_bSwapped || pHeader->magic == MSGCATALOG_MAGIC;
385 }
386
387 if ( !bValid ) {
388 // it's either too short or has incorrect magic number
389 wxLogWarning(_("'%s' is not a valid message catalog."), strFullName.c_str());
390
391 wxDELETEA(m_pData);
392 return FALSE;
393 }
394
395 // initialize
396 m_numStrings = Swap(pHeader->numStrings);
397 m_pOrigTable = (wxMsgTableEntry *)(m_pData +
398 Swap(pHeader->ofsOrigTable));
399 m_pTransTable = (wxMsgTableEntry *)(m_pData +
400 Swap(pHeader->ofsTransTable));
401
402 m_nHashSize = Swap(pHeader->nHashSize);
403 m_pHashTable = (size_t32 *)(m_pData + Swap(pHeader->ofsHashTable));
404
405 m_pszName = new wxChar[wxStrlen(szName) + 1];
406 wxStrcpy(m_pszName, szName);
407
408 if (bConvertEncoding) ConvertEncoding();
409
410 // everything is fine
411 return TRUE;
412}
413
414// search for a string
415const char *wxMsgCatalog::GetString(const char *szOrig) const
416{
417 if ( szOrig == NULL )
418 return NULL;
419
420 if ( HasHashTable() ) { // use hash table for lookup if possible
421 size_t32 nHashVal = GetHash(szOrig);
422 size_t32 nIndex = nHashVal % m_nHashSize;
423
424 size_t32 nIncr = 1 + (nHashVal % (m_nHashSize - 2));
425
426#if defined(__VISAGECPP__)
427// VA just can't stand while(1) or while(TRUE)
428 bool bOs2var = TRUE;
429 while(bOs2var) {
430#else
431 while (1) {
432#endif
433 size_t32 nStr = Swap(m_pHashTable[nIndex]);
434 if ( nStr == 0 )
435 return NULL;
436
437 if ( strcmp(szOrig, StringAtOfs(m_pOrigTable, nStr - 1)) == 0 )
438 return StringAtOfs(m_pTransTable, nStr - 1);
439
440 if ( nIndex >= m_nHashSize - nIncr)
441 nIndex -= m_nHashSize - nIncr;
442 else
443 nIndex += nIncr;
444 }
445 }
446 else { // no hash table: use default binary search
447 size_t32 bottom = 0,
448 top = m_numStrings,
449 current;
450 while ( bottom < top ) {
451 current = (bottom + top) / 2;
452 int res = strcmp(szOrig, StringAtOfs(m_pOrigTable, current));
453 if ( res < 0 )
454 top = current;
455 else if ( res > 0 )
456 bottom = current + 1;
457 else // found!
458 return StringAtOfs(m_pTransTable, current);
459 }
460 }
461
462 // not found
463 return NULL;
464}
465
466
467#if wxUSE_GUI
468#include "wx/fontmap.h"
469#include "wx/encconv.h"
470#endif
471
472void wxMsgCatalog::ConvertEncoding()
473{
474#if wxUSE_GUI
475 wxFontEncoding enc;
476
477 // first, find encoding header:
478 const char *hdr = StringAtOfs(m_pOrigTable, 0);
479 if (hdr == NULL) return; // not supported by this catalog, does not have non-fuzzy header
480 if (hdr[0] != 0) return; // ditto
481
482 /* we support catalogs with header (msgid "") that is _not_ marked as "#, fuzzy" (otherwise
483 the string would not be included into compiled catalog) */
484 wxString header(StringAtOfs(m_pTransTable, 0));
485 wxString charset;
486 int pos = header.Find(wxT("Content-Type: text/plain; charset="));
487 if (pos == wxNOT_FOUND)
488 return; // incorrectly filled Content-Type header
489 size_t n = pos + 34; /*strlen("Content-Type: text/plain; charset=")*/
490 while (header[n] != wxT('\n'))
491 charset << header[n++];
492
493 enc = wxTheFontMapper->CharsetToEncoding(charset, FALSE);
494 if ( enc == wxFONTENCODING_SYSTEM )
495 return; // unknown encoding
496
497 wxFontEncodingArray a = wxEncodingConverter::GetPlatformEquivalents(enc);
498 if (a[0] == enc)
499 return; // no conversion needed, locale uses native encoding
500
501 if (a.GetCount() == 0)
502 return; // we don't know common equiv. under this platform
503
504 wxEncodingConverter converter;
505
506 converter.Init(enc, a[0]);
507 for (size_t i = 0; i < m_numStrings; i++)
508 converter.Convert((char*)StringAtOfs(m_pTransTable, i));
509#endif
510}
511
512
513// ----------------------------------------------------------------------------
514// wxLocale
515// ----------------------------------------------------------------------------
516
517wxLocale::wxLocale()
518{
519 m_pszOldLocale = NULL;
520 m_pMsgCat = NULL;
521}
522
523// NB: this function has (desired) side effect of changing current locale
524bool wxLocale::Init(const wxChar *szName,
525 const wxChar *szShort,
526 const wxChar *szLocale,
527 bool bLoadDefault,
528 bool bConvertEncoding)
529{
530 m_strLocale = szName;
531 m_strShort = szShort;
532 m_bConvertEncoding = bConvertEncoding;
533
534 // change current locale (default: same as long name)
535 if ( szLocale == NULL )
536 {
537 // the argument to setlocale()
538 szLocale = szShort;
539 }
540 m_pszOldLocale = wxSetlocale(LC_ALL, szLocale);
541 if ( m_pszOldLocale == NULL )
542 wxLogError(_("locale '%s' can not be set."), szLocale);
543
544 // the short name will be used to look for catalog files as well,
545 // so we need something here
546 if ( m_strShort.IsEmpty() ) {
547 // FIXME I don't know how these 2 letter abbreviations are formed,
548 // this wild guess is surely wrong
549 m_strShort = tolower(szLocale[0]) + tolower(szLocale[1]);
550 }
551
552 // save the old locale to be able to restore it later
553 m_pOldLocale = wxSetLocale(this);
554
555 // load the default catalog with wxWindows standard messages
556 m_pMsgCat = NULL;
557 bool bOk = TRUE;
558 if ( bLoadDefault )
559 bOk = AddCatalog(wxT("wxstd"));
560
561 return bOk;
562}
563
564void wxLocale::AddCatalogLookupPathPrefix(const wxString& prefix)
565{
566 if ( s_searchPrefixes.Index(prefix) == wxNOT_FOUND )
567 {
568 s_searchPrefixes.Add(prefix);
569 }
570 //else: already have it
571}
572
573// clean up
574wxLocale::~wxLocale()
575{
576 // free memory
577 wxMsgCatalog *pTmpCat;
578 while ( m_pMsgCat != NULL ) {
579 pTmpCat = m_pMsgCat;
580 m_pMsgCat = m_pMsgCat->m_pNext;
581 delete pTmpCat;
582 }
583
584 // restore old locale
585 wxSetLocale(m_pOldLocale);
586 wxSetlocale(LC_ALL, m_pszOldLocale);
587}
588
589// get the translation of given string in current locale
590const wxMB2WXbuf wxLocale::GetString(const wxChar *szOrigString,
591 const wxChar *szDomain) const
592{
593 if ( wxIsEmpty(szOrigString) )
594 return szDomain;
595
596 const char *pszTrans = NULL;
597#if wxUSE_UNICODE
598 const wxWX2MBbuf szOrgString = wxConvCurrent->cWX2MB(szOrigString);
599#else // ANSI
600 #define szOrgString szOrigString
601#endif // Unicode/ANSI
602
603 wxMsgCatalog *pMsgCat;
604 if ( szDomain != NULL ) {
605 pMsgCat = FindCatalog(szDomain);
606
607 // does the catalog exist?
608 if ( pMsgCat != NULL )
609 pszTrans = pMsgCat->GetString(szOrgString);
610 }
611 else {
612 // search in all domains
613 for ( pMsgCat = m_pMsgCat; pMsgCat != NULL; pMsgCat = pMsgCat->m_pNext ) {
614 pszTrans = pMsgCat->GetString(szOrgString);
615 if ( pszTrans != NULL ) // take the first found
616 break;
617 }
618 }
619
620 if ( pszTrans == NULL ) {
621 if ( wxIsLoggingTransErrors() ) {
622 // suppress further error messages if we're not debugging: this avoids
623 // flooding the user with messages about each and every missing string if,
624 // for example, a whole catalog file is missing.
625
626 // do it before calling LogWarning to prevent infinite recursion!
627#ifdef __WXDEBUG__
628 NoTransErr noTransErr;
629#else // !debug
630 wxSuppressTransErrors();
631#endif // debug/!debug
632
633 if ( szDomain != NULL )
634 {
635 wxLogWarning(_("string '%s' not found in domain '%s' for locale '%s'."),
636 szOrigString, szDomain, m_strLocale.c_str());
637 }
638 else
639 {
640 wxLogWarning(_("string '%s' not found in locale '%s'."),
641 szOrigString, m_strLocale.c_str());
642 }
643 }
644
645 return (wxMB2WXbuf)(szOrigString);
646 }
647 else
648 {
649 return wxConvertMB2WX(pszTrans); // or preferably wxCSConv(charset).cMB2WX(pszTrans) or something,
650 // a macro similar to wxConvertMB2WX could be written for that
651 }
652
653 #undef szOrgString
654}
655
656// find catalog by name in a linked list, return NULL if !found
657wxMsgCatalog *wxLocale::FindCatalog(const wxChar *szDomain) const
658{
659// linear search in the linked list
660 wxMsgCatalog *pMsgCat;
661 for ( pMsgCat = m_pMsgCat; pMsgCat != NULL; pMsgCat = pMsgCat->m_pNext ) {
662 if ( wxStricmp(pMsgCat->GetName(), szDomain) == 0 )
663 return pMsgCat;
664 }
665
666 return NULL;
667}
668
669// check if the given catalog is loaded
670bool wxLocale::IsLoaded(const wxChar *szDomain) const
671{
672 return FindCatalog(szDomain) != NULL;
673}
674
675// add a catalog to our linked list
676bool wxLocale::AddCatalog(const wxChar *szDomain)
677{
678 wxMsgCatalog *pMsgCat = new wxMsgCatalog;
679
680 if ( pMsgCat->Load(m_strShort, szDomain, m_bConvertEncoding) ) {
681 // add it to the head of the list so that in GetString it will
682 // be searched before the catalogs added earlier
683 pMsgCat->m_pNext = m_pMsgCat;
684 m_pMsgCat = pMsgCat;
685
686 return TRUE;
687 }
688 else {
689 // don't add it because it couldn't be loaded anyway
690 delete pMsgCat;
691
692 return FALSE;
693 }
694}
695
696// ----------------------------------------------------------------------------
697// global functions and variables
698// ----------------------------------------------------------------------------
699
700// translation errors logging
701// --------------------------
702
703static bool gs_bGiveTransErrors = TRUE;
704
705void wxSuppressTransErrors()
706{
707 gs_bGiveTransErrors = FALSE;
708}
709
710void wxRestoreTransErrors()
711{
712 gs_bGiveTransErrors = TRUE;
713}
714
715bool wxIsLoggingTransErrors()
716{
717 return gs_bGiveTransErrors;
718}
719
720// retrieve/change current locale
721// ------------------------------
722
723// the current locale object
724static wxLocale *g_pLocale = NULL;
725
726wxLocale *wxGetLocale()
727{
728 return g_pLocale;
729}
730
731wxLocale *wxSetLocale(wxLocale *pLocale)
732{
733 wxLocale *pOld = g_pLocale;
734 g_pLocale = pLocale;
735 return pOld;
736}
737
738#endif // wxUSE_INTL
739