]> git.saurik.com Git - apple/icu.git/blame - icuSources/common/resbund.cpp
ICU-6.2.4.tar.gz
[apple/icu.git] / icuSources / common / resbund.cpp
CommitLineData
b75a7d8f
A
1/*
2**********************************************************************
374ca955 3* Copyright (C) 1997-2004, International Business Machines
b75a7d8f
A
4* Corporation and others. All Rights Reserved.
5**********************************************************************
6*
7* File resbund.cpp
8*
9* Modification History:
10*
11* Date Name Description
12* 02/05/97 aliu Fixed bug in chopLocale. Added scanForLocaleInFile
13* based on code taken from scanForLocale. Added
14* constructor which attempts to read resource bundle
15* from a specific file, without searching other files.
16* 02/11/97 aliu Added UErrorCode return values to constructors. Fixed
17* infinite loops in scanForFile and scanForLocale.
18* Modified getRawResourceData to not delete storage in
19* localeData and resourceData which it doesn't own.
20* Added Mac compatibility #ifdefs for tellp() and
21* ios::nocreate.
22* 03/04/97 aliu Modified to use ExpandingDataSink objects instead of
23* the highly inefficient ostrstream objects.
24* 03/13/97 aliu Rewrote to load in entire resource bundle and store
25* it as a Hashtable of ResourceBundleData objects.
26* Added state table to govern parsing of files.
27* Modified to load locale index out of new file distinct
28* from default.txt.
29* 03/25/97 aliu Modified to support 2-d arrays, needed for timezone data.
30* Added support for custom file suffixes. Again, needed
31* to support timezone data. Improved error handling to
32* detect duplicate tags and subtags.
33* 04/07/97 aliu Fixed bug in getHashtableForLocale(). Fixed handling
34* of failing UErrorCode values on entry to API methods.
35* Fixed bugs in getArrayItem() for negative indices.
36* 04/29/97 aliu Update to use new Hashtable deletion protocol.
37* 05/06/97 aliu Flattened kTransitionTable for HP compiler.
38* Fixed usage of CharString.
39* 06/11/99 stephen Removed parsing of .txt files.
40* Reworked to use new binary format.
41* Cleaned up.
42* 06/14/99 stephen Removed methods taking a filename suffix.
43* 06/22/99 stephen Added missing T_FileStream_close in parse()
44* 11/09/99 weiv Added getLocale(), rewritten constructForLocale()
45* March 2000 weiv complete overhaul.
46******************************************************************************
47*/
48
49#include "unicode/utypes.h"
50#include "unicode/resbund.h"
374ca955 51#include "umutex.h"
b75a7d8f
A
52
53#include "uresimp.h"
54
55U_NAMESPACE_BEGIN
56
57/*-----------------------------------------------------------------------------
58 * Implementation Notes
59 *
60 * Resource bundles are read in once, and thereafter cached.
61 * ResourceBundle statically keeps track of which files have been
62 * read, so we are guaranteed that each file is read at most once.
63 * Resource bundles can be loaded from different data directories and
64 * will be treated as distinct, even if they are for the same locale.
65 *
66 * Resource bundles are lightweight objects, which have pointers to
67 * one or more shared Hashtable objects containing all the data.
68 * Copying would be cheap, but there is no copy constructor, since
69 * there wasn't one in the original API.
70 *
71 * The ResourceBundle parsing mechanism is implemented as a transition
72 * network, for easy maintenance and modification. The network is
73 * implemented as a matrix (instead of in code) to make this even
74 * easier. The matrix contains Transition objects. Each Transition
75 * object describes a destination node and an action to take before
76 * moving to the destination node. The source node is encoded by the
77 * index of the object in the array that contains it. The pieces
78 * needed to understand the transition network are the enums for node
79 * IDs and actions, the parse() method, which walks through the
80 * network and implements the actions, and the network itself. The
81 * network guarantees certain conditions, for example, that a new
82 * resource will not be closed until one has been opened first; or
83 * that data will not be stored into a TaggedList until a TaggedList
84 * has been created. Nonetheless, the code in parse() does some
85 * consistency checks as it runs the network, and fails with a
86 * U_INTERNAL_PROGRAM_ERROR if one of these checks fails. If the input
87 * data has a bad format, a U_INVALID_FORMAT_ERROR is returned. If you
88 * see a U_INTERNAL_PROGRAM_ERROR the transition matrix has a bug in
89 * it.
90 *
91 * Old functionality of multiple locales in a single file is still
92 * supported. For this reason, LOCALE names override FILE names. If
93 * data for en_US is located in the en.txt file, once it is loaded,
94 * the code will not care where it came from (other than remembering
95 * which directory it came from). However, if there is an en_US
96 * resource in en_US.txt, that will take precedence. There is no
97 * limit to the number or type of resources that can be stored in a
98 * file, however, files are only searched in a specific way. If
99 * en_US_CA is requested, then first en_US_CA.txt is searched, then
100 * en_US.txt, then en.txt, then default.txt. So it only makes sense
101 * to put certain locales in certain files. In this example, it would
102 * be logical to put en_US_CA, en_US, and en into the en.txt file,
103 * since they would be found there if asked for. The extreme example
104 * is to place all locale resources into default.txt, which should
105 * also work.
106 *
107 * Inheritance is implemented. For example, xx_YY_zz inherits as
108 * follows: xx_YY_zz, xx_YY, xx, default. Inheritance is implemented
109 * as an array of hashtables. There will be from 1 to 4 hashtables in
110 * the array.
111 *
112 * Fallback files are implemented. The fallback pattern is Language
113 * Country Variant (LCV) -> LC -> L. Fallback is first done for the
114 * requested locale. Then it is done for the default locale, as
115 * returned by Locale::getDefault(). Then the special file
116 * default.txt is searched for the default locale. The overall FILE
117 * fallback path is LCV -> LC -> L -> dLCV -> dLC -> dL -> default.
118 *
119 * Note that although file name searching includes the default locale,
120 * once a ResourceBundle object is constructed, the inheritance path
121 * no longer includes the default locale. The path is LCV -> LC -> L
122 * -> default.
123 *
124 * File parsing is lazy. Nothing is parsed unless it is called for by
125 * someone. So when a ResourceBundle for xx_YY_zz is constructed,
126 * only that locale is parsed (along with anything else in the same
127 * file). Later, if the FooBar tag is asked for, and if it isn't
128 * found in xx_YY_zz, then xx_YY.txt will be parsed and checked, and
129 * so forth, until the chain is exhausted or the tag is found.
130 *
131 * Thread-safety is implemented around caches, both the cache that
132 * stores all the resource data, and the cache that stores flags
133 * indicating whether or not a file has been visited. These caches
134 * delete their storage at static cleanup time, when the process
135 * quits.
136 *
137 * ResourceBundle supports TableCollation as a special case. This
138 * involves having special ResourceBundle objects which DO own their
139 * data, since we don't want large collation rule strings in the
140 * ResourceBundle cache (these are already cached in the
141 * TableCollation cache). TableCollation files (.ctx files) have the
142 * same format as normal resource data files, with a different
143 * interpretation, from the standpoint of ResourceBundle. .ctx files
144 * are loaded into otherwise ordinary ResourceBundle objects. They
145 * don't inherit (that's implemented by TableCollation) and they own
146 * their data (as mentioned above). However, they still support
147 * possible multiple locales in a single .ctx file. (This is in
148 * practice a bad idea, since you only want the one locale you're
149 * looking for, and only one tag will be present
150 * ("CollationElements"), so you don't need an inheritance chain of
151 * multiple locales.) Up to 4 locale resources will be loaded from a
152 * .ctx file; everything after the first 4 is ignored (parsed and
153 * deleted). (Normal .txt files have no limit.) Instead of being
154 * loaded into the cache, and then looked up as needed, the locale
155 * resources are read straight into the ResourceBundle object.
156 *
157 * The Index, which used to reside in default.txt, has been moved to a
158 * new file, index.txt. This file contains a slightly modified format
159 * with the addition of the "InstalledLocales" tag; it looks like:
160 *
161 * Index {
162 * InstalledLocales {
163 * ar
164 * ..
165 * zh_TW
166 * }
167 * }
168 */
169//-----------------------------------------------------------------------------
170
374ca955 171UOBJECT_DEFINE_RTTI_IMPLEMENTATION(ResourceBundle)
b75a7d8f
A
172
173ResourceBundle::ResourceBundle(UErrorCode &err)
374ca955 174 :UObject(), fLocale(NULL)
b75a7d8f 175{
374ca955 176 fResource = ures_open(0, Locale::getDefault().getName(), &err);
b75a7d8f
A
177}
178
179ResourceBundle::ResourceBundle(const ResourceBundle &other)
374ca955 180 :UObject(other), fLocale(NULL)
b75a7d8f
A
181{
182 UErrorCode status = U_ZERO_ERROR;
183
374ca955
A
184 if (other.fResource) {
185 fResource = ures_copyResb(0, other.fResource, &status);
b75a7d8f
A
186 } else {
187 /* Copying a bad resource bundle */
374ca955 188 fResource = NULL;
b75a7d8f
A
189 }
190}
191
192ResourceBundle::ResourceBundle(UResourceBundle *res, UErrorCode& err)
374ca955 193 :UObject(), fLocale(NULL)
b75a7d8f
A
194{
195 if (res) {
374ca955 196 fResource = ures_copyResb(0, res, &err);
b75a7d8f
A
197 } else {
198 /* Copying a bad resource bundle */
374ca955 199 fResource = NULL;
b75a7d8f
A
200 }
201}
202
203ResourceBundle::ResourceBundle(const char* path, const Locale& locale, UErrorCode& err)
374ca955 204 :UObject(), fLocale(NULL)
b75a7d8f 205{
374ca955 206 fResource = ures_open(path, locale.getName(), &err);
b75a7d8f
A
207}
208
209
210ResourceBundle& ResourceBundle::operator=(const ResourceBundle& other)
211{
212 if(this == &other) {
213 return *this;
214 }
374ca955
A
215 if(fResource != 0) {
216 ures_close(fResource);
217 fResource = NULL;
b75a7d8f
A
218 }
219 UErrorCode status = U_ZERO_ERROR;
374ca955
A
220 if (other.fResource) {
221 fResource = ures_copyResb(0, other.fResource, &status);
b75a7d8f
A
222 } else {
223 /* Copying a bad resource bundle */
374ca955 224 fResource = NULL;
b75a7d8f
A
225 }
226 return *this;
227}
228
229ResourceBundle::~ResourceBundle()
230{
374ca955
A
231 if(fResource != 0) {
232 ures_close(fResource);
b75a7d8f 233 }
374ca955
A
234 if(fLocale != NULL) {
235 delete(fLocale);
b75a7d8f
A
236 }
237}
238
374ca955
A
239ResourceBundle *
240ResourceBundle::clone() const {
241 return new ResourceBundle(*this);
b75a7d8f
A
242}
243
244UnicodeString ResourceBundle::getString(UErrorCode& status) const {
245 int32_t len = 0;
374ca955 246 const UChar *r = ures_getString(fResource, &len, &status);
b75a7d8f
A
247 return UnicodeString(TRUE, r, len);
248}
249
250const uint8_t *ResourceBundle::getBinary(int32_t& len, UErrorCode& status) const {
374ca955 251 return ures_getBinary(fResource, &len, &status);
b75a7d8f
A
252}
253
254const int32_t *ResourceBundle::getIntVector(int32_t& len, UErrorCode& status) const {
374ca955 255 return ures_getIntVector(fResource, &len, &status);
b75a7d8f
A
256}
257
258uint32_t ResourceBundle::getUInt(UErrorCode& status) const {
374ca955 259 return ures_getUInt(fResource, &status);
b75a7d8f
A
260}
261
262int32_t ResourceBundle::getInt(UErrorCode& status) const {
374ca955 263 return ures_getInt(fResource, &status);
b75a7d8f
A
264}
265
374ca955
A
266const char *ResourceBundle::getName(void) const {
267 return ures_getName(fResource);
b75a7d8f
A
268}
269
374ca955
A
270const char *ResourceBundle::getKey(void) const {
271 return ures_getKey(fResource);
b75a7d8f
A
272}
273
374ca955
A
274UResType ResourceBundle::getType(void) const {
275 return ures_getType(fResource);
b75a7d8f
A
276}
277
278int32_t ResourceBundle::getSize(void) const {
374ca955 279 return ures_getSize(fResource);
b75a7d8f
A
280}
281
282UBool ResourceBundle::hasNext(void) const {
374ca955 283 return ures_hasNext(fResource);
b75a7d8f
A
284}
285
286void ResourceBundle::resetIterator(void) {
374ca955 287 ures_resetIterator(fResource);
b75a7d8f
A
288}
289
290ResourceBundle ResourceBundle::getNext(UErrorCode& status) {
291 UResourceBundle r;
292
293 ures_initStackObject(&r);
374ca955 294 ures_getNextResource(fResource, &r, &status);
b75a7d8f
A
295 ResourceBundle res(&r, status);
296 if (U_SUCCESS(status)) {
297 ures_close(&r);
298 }
299 return res;
300}
301
302UnicodeString ResourceBundle::getNextString(UErrorCode& status) {
303 int32_t len = 0;
374ca955 304 const UChar* r = ures_getNextString(fResource, &len, 0, &status);
b75a7d8f
A
305 return UnicodeString(TRUE, r, len);
306}
307
308UnicodeString ResourceBundle::getNextString(const char ** key, UErrorCode& status) {
309 int32_t len = 0;
374ca955 310 const UChar* r = ures_getNextString(fResource, &len, key, &status);
b75a7d8f
A
311 return UnicodeString(TRUE, r, len);
312}
313
314ResourceBundle ResourceBundle::get(int32_t indexR, UErrorCode& status) const {
315 UResourceBundle r;
316
317 ures_initStackObject(&r);
374ca955 318 ures_getByIndex(fResource, indexR, &r, &status);
b75a7d8f
A
319 ResourceBundle res(&r, status);
320 if (U_SUCCESS(status)) {
321 ures_close(&r);
322 }
323 return res;
324}
325
326UnicodeString ResourceBundle::getStringEx(int32_t indexS, UErrorCode& status) const {
327 int32_t len = 0;
374ca955 328 const UChar* r = ures_getStringByIndex(fResource, indexS, &len, &status);
b75a7d8f
A
329 return UnicodeString(TRUE, r, len);
330}
331
332ResourceBundle ResourceBundle::get(const char* key, UErrorCode& status) const {
333 UResourceBundle r;
334
335 ures_initStackObject(&r);
374ca955 336 ures_getByKey(fResource, key, &r, &status);
b75a7d8f
A
337 ResourceBundle res(&r, status);
338 if (U_SUCCESS(status)) {
339 ures_close(&r);
340 }
341 return res;
342}
343
374ca955
A
344ResourceBundle ResourceBundle::getWithFallback(const char* key, UErrorCode& status){
345 UResourceBundle r;
346 ures_initStackObject(&r);
347 ures_getByKeyWithFallback(fResource, key, &r, &status);
348 ResourceBundle res(&r, status);
349 if(U_SUCCESS(status)){
350 ures_close(&r);
351 }
352 return res;
353}
b75a7d8f
A
354UnicodeString ResourceBundle::getStringEx(const char* key, UErrorCode& status) const {
355 int32_t len = 0;
374ca955 356 const UChar* r = ures_getStringByKey(fResource, key, &len, &status);
b75a7d8f
A
357 return UnicodeString(TRUE, r, len);
358}
359
360const char*
361ResourceBundle::getVersionNumber() const
362{
374ca955 363 return ures_getVersionNumber(fResource);
b75a7d8f
A
364}
365
366void ResourceBundle::getVersion(UVersionInfo versionInfo) const {
374ca955 367 ures_getVersion(fResource, versionInfo);
b75a7d8f
A
368}
369
370const Locale &ResourceBundle::getLocale(void) const
371{
374ca955
A
372 UBool needInit;
373 umtx_lock(NULL);
374 needInit = (fLocale == NULL);
375 umtx_unlock(NULL);
376 if(needInit) {
377 UErrorCode status = U_ZERO_ERROR;
378 const char *localeName = ures_getLocale(fResource, &status);
379 Locale *tLocale = new Locale(localeName);
380 umtx_lock(NULL);
381 ResourceBundle *me = (ResourceBundle *)this; // semantically const
382 if (me->fLocale == NULL) {
383 me->fLocale = tLocale;
384 tLocale = NULL;
385 }
386 umtx_unlock(NULL);
387 delete tLocale;
388 }
389 return *fLocale;
390}
391
392const Locale ResourceBundle::getLocale(ULocDataLocaleType type, UErrorCode &status) const
393{
394 return ures_getLocaleByType(fResource, type, &status);
b75a7d8f
A
395}
396
397//eof
398U_NAMESPACE_END