]>
git.saurik.com Git - apple/icu.git/blob - icuSources/common/resbund.cpp
2 **********************************************************************
3 * Copyright (C) 1997-2004, International Business Machines
4 * Corporation and others. All Rights Reserved.
5 **********************************************************************
9 * Modification History:
11 * Date Name Description
12 * 02/05/97 aliu Fixed bug in chopLocale. Added scanForLocaleInFile
13 * based on code taken from scanForLocale. Added
14 * constructor which attempts to read resource bundle
15 * from a specific file, without searching other files.
16 * 02/11/97 aliu Added UErrorCode return values to constructors. Fixed
17 * infinite loops in scanForFile and scanForLocale.
18 * Modified getRawResourceData to not delete storage in
19 * localeData and resourceData which it doesn't own.
20 * Added Mac compatibility #ifdefs for tellp() and
22 * 03/04/97 aliu Modified to use ExpandingDataSink objects instead of
23 * the highly inefficient ostrstream objects.
24 * 03/13/97 aliu Rewrote to load in entire resource bundle and store
25 * it as a Hashtable of ResourceBundleData objects.
26 * Added state table to govern parsing of files.
27 * Modified to load locale index out of new file distinct from default.txt.
29 * 03/25/97 aliu Modified to support 2-d arrays, needed for timezone data.
30 * Added support for custom file suffixes. Again, needed
31 * to support timezone data. Improved error handling to
32 * detect duplicate tags and subtags.
33 * 04/07/97 aliu Fixed bug in getHashtableForLocale(). Fixed handling
34 * of failing UErrorCode values on entry to API methods.
35 * Fixed bugs in getArrayItem() for negative indices.
36 * 04/29/97 aliu Update to use new Hashtable deletion protocol.
37 * 05/06/97 aliu Flattened kTransitionTable for HP compiler.
38 * Fixed usage of CharString.
39 * 06/11/99 stephen Removed parsing of .txt files.
40 * Reworked to use new binary format.
42 * 06/14/99 stephen Removed methods taking a filename suffix.
43 * 06/22/99 stephen Added missing T_FileStream_close in parse()
44 * 11/09/99 weiv Added getLocale(), rewritten constructForLocale()
45 * March 2000 weiv complete overhaul.
46 ******************************************************************************
49 #include "unicode/utypes.h"
50 #include "unicode/resbund.h"
57 /*-----------------------------------------------------------------------------
58 * Implementation Notes
60 * Resource bundles are read in once, and thereafter cached.
61 * ResourceBundle statically keeps track of which files have been
62 * read, so we are guaranteed that each file is read at most once.
63 * Resource bundles can be loaded from different data directories and
64 * will be treated as distinct, even if they are for the same locale.
66 * Resource bundles are lightweight objects, which have pointers to
67 * one or more shared Hashtable objects containing all the data.
68 * Copying would be cheap, but there is no copy constructor, since
69 * there wasn't one in the original API.
71 * The ResourceBundle parsing mechanism is implemented as a transition
72 * network, for easy maintenance and modification. The network is
73 * implemented as a matrix (instead of in code) to make this even
74 * easier. The matrix contains Transition objects. Each Transition
75 * object describes a destination node and an action to take before
76 * moving to the destination node. The source node is encoded by the
77 * index of the object in the array that contains it. The pieces
78 * needed to understand the transition network are the enums for node
79 * IDs and actions, the parse() method, which walks through the
80 * network and implements the actions, and the network itself. The
81 * network guarantees certain conditions, for example, that a new
82 * resource will not be closed until one has been opened first; or
83 * that data will not be stored into a TaggedList until a TaggedList
84 * has been created. Nonetheless, the code in parse() does some
85 * consistency checks as it runs the network, and fails with a
86 * U_INTERNAL_PROGRAM_ERROR if one of these checks fails. If the input
87 * data has a bad format, a U_INVALID_FORMAT_ERROR is returned. If you
88 * see a U_INTERNAL_PROGRAM_ERROR, the transition matrix has a bug in it.
91 * Old functionality of multiple locales in a single file is still
92 * supported. For this reason, LOCALE names override FILE names. If
93 * data for en_US is located in the en.txt file, once it is loaded,
94 * the code will not care where it came from (other than remembering
95 * which directory it came from). However, if there is an en_US
96 * resource in en_US.txt, that will take precedence. There is no
97 * limit to the number or type of resources that can be stored in a
98 * file; however, files are only searched in a specific way. If
99 * en_US_CA is requested, then first en_US_CA.txt is searched, then
100 * en_US.txt, then en.txt, then default.txt. So it only makes sense
101 * to put certain locales in certain files. In this example, it would
102 * be logical to put en_US_CA, en_US, and en into the en.txt file,
103 * since they would be found there if asked for. The extreme example
104 * is to place all locale resources into default.txt, which should
107 * Inheritance is implemented. For example, xx_YY_zz inherits as
108 * follows: xx_YY_zz, xx_YY, xx, default. Inheritance is implemented
109 * as an array of hashtables. There will be from 1 to 4 hashtables in the array.
112 * Fallback files are implemented. The fallback pattern is Language
113 * Country Variant (LCV) -> LC -> L. Fallback is first done for the
114 * requested locale. Then it is done for the default locale, as
115 * returned by Locale::getDefault(). Then the special file
116 * default.txt is searched for the default locale. The overall FILE
117 * fallback path is LCV -> LC -> L -> dLCV -> dLC -> dL -> default.
119 * Note that although file name searching includes the default locale,
120 * once a ResourceBundle object is constructed, the inheritance path
121 * no longer includes the default locale. The path is LCV -> LC -> L -> default.
124 * File parsing is lazy. Nothing is parsed unless it is called for by
125 * someone. So when a ResourceBundle for xx_YY_zz is constructed,
126 * only that locale is parsed (along with anything else in the same
127 * file). Later, if the FooBar tag is asked for, and if it isn't
128 * found in xx_YY_zz, then xx_YY.txt will be parsed and checked, and
129 * so forth, until the chain is exhausted or the tag is found.
131 * Thread-safety is implemented around caches, both the cache that
132 * stores all the resource data, and the cache that stores flags
133 * indicating whether or not a file has been visited. These caches
134 * delete their storage at static cleanup time, when the process exits.
137 * ResourceBundle supports TableCollation as a special case. This
138 * involves having special ResourceBundle objects which DO own their
139 * data, since we don't want large collation rule strings in the
140 * ResourceBundle cache (these are already cached in the
141 * TableCollation cache). TableCollation files (.ctx files) have the
142 * same format as normal resource data files, with a different
143 * interpretation, from the standpoint of ResourceBundle. .ctx files
144 * are loaded into otherwise ordinary ResourceBundle objects. They
145 * don't inherit (that's implemented by TableCollation) and they own
146 * their data (as mentioned above). However, they still support
147 * possible multiple locales in a single .ctx file. (This is in
148 * practice a bad idea, since you only want the one locale you're
149 * looking for, and only one tag will be present
150 * ("CollationElements"), so you don't need an inheritance chain of
151 * multiple locales.) Up to 4 locale resources will be loaded from a
152 * .ctx file; everything after the first 4 is ignored (parsed and
153 * deleted). (Normal .txt files have no limit.) Instead of being
154 * loaded into the cache, and then looked up as needed, the locale
155 * resources are read straight into the ResourceBundle object.
157 * The Index, which used to reside in default.txt, has been moved to a
158 * new file, index.txt. This file contains a slightly modified format
159 * with the addition of the "InstalledLocales" tag; it looks like:
169 //-----------------------------------------------------------------------------
171 UOBJECT_DEFINE_RTTI_IMPLEMENTATION(ResourceBundle
)
173 ResourceBundle::ResourceBundle(UErrorCode
&err
)
174 :UObject(), fLocale(NULL
)
176 fResource
= ures_open(0, Locale::getDefault().getName(), &err
);
179 ResourceBundle::ResourceBundle(const ResourceBundle
&other
)
180 :UObject(other
), fLocale(NULL
)
182 UErrorCode status
= U_ZERO_ERROR
;
184 if (other
.fResource
) {
185 fResource
= ures_copyResb(0, other
.fResource
, &status
);
187 /* Copying a bad resource bundle */
192 ResourceBundle::ResourceBundle(UResourceBundle
*res
, UErrorCode
& err
)
193 :UObject(), fLocale(NULL
)
196 fResource
= ures_copyResb(0, res
, &err
);
198 /* Copying a bad resource bundle */
203 ResourceBundle::ResourceBundle(const char* path
, const Locale
& locale
, UErrorCode
& err
)
204 :UObject(), fLocale(NULL
)
206 fResource
= ures_open(path
, locale
.getName(), &err
);
210 ResourceBundle
& ResourceBundle::operator=(const ResourceBundle
& other
)
216 ures_close(fResource
);
219 UErrorCode status
= U_ZERO_ERROR
;
220 if (other
.fResource
) {
221 fResource
= ures_copyResb(0, other
.fResource
, &status
);
223 /* Copying a bad resource bundle */
229 ResourceBundle::~ResourceBundle()
232 ures_close(fResource
);
234 if(fLocale
!= NULL
) {
240 ResourceBundle::clone() const {
241 return new ResourceBundle(*this);
244 UnicodeString
ResourceBundle::getString(UErrorCode
& status
) const {
246 const UChar
*r
= ures_getString(fResource
, &len
, &status
);
247 return UnicodeString(TRUE
, r
, len
);
250 const uint8_t *ResourceBundle::getBinary(int32_t& len
, UErrorCode
& status
) const {
251 return ures_getBinary(fResource
, &len
, &status
);
254 const int32_t *ResourceBundle::getIntVector(int32_t& len
, UErrorCode
& status
) const {
255 return ures_getIntVector(fResource
, &len
, &status
);
258 uint32_t ResourceBundle::getUInt(UErrorCode
& status
) const {
259 return ures_getUInt(fResource
, &status
);
262 int32_t ResourceBundle::getInt(UErrorCode
& status
) const {
263 return ures_getInt(fResource
, &status
);
266 const char *ResourceBundle::getName(void) const {
267 return ures_getName(fResource
);
270 const char *ResourceBundle::getKey(void) const {
271 return ures_getKey(fResource
);
274 UResType
ResourceBundle::getType(void) const {
275 return ures_getType(fResource
);
278 int32_t ResourceBundle::getSize(void) const {
279 return ures_getSize(fResource
);
282 UBool
ResourceBundle::hasNext(void) const {
283 return ures_hasNext(fResource
);
286 void ResourceBundle::resetIterator(void) {
287 ures_resetIterator(fResource
);
290 ResourceBundle
ResourceBundle::getNext(UErrorCode
& status
) {
293 ures_initStackObject(&r
);
294 ures_getNextResource(fResource
, &r
, &status
);
295 ResourceBundle
res(&r
, status
);
296 if (U_SUCCESS(status
)) {
302 UnicodeString
ResourceBundle::getNextString(UErrorCode
& status
) {
304 const UChar
* r
= ures_getNextString(fResource
, &len
, 0, &status
);
305 return UnicodeString(TRUE
, r
, len
);
308 UnicodeString
ResourceBundle::getNextString(const char ** key
, UErrorCode
& status
) {
310 const UChar
* r
= ures_getNextString(fResource
, &len
, key
, &status
);
311 return UnicodeString(TRUE
, r
, len
);
314 ResourceBundle
ResourceBundle::get(int32_t indexR
, UErrorCode
& status
) const {
317 ures_initStackObject(&r
);
318 ures_getByIndex(fResource
, indexR
, &r
, &status
);
319 ResourceBundle
res(&r
, status
);
320 if (U_SUCCESS(status
)) {
326 UnicodeString
ResourceBundle::getStringEx(int32_t indexS
, UErrorCode
& status
) const {
328 const UChar
* r
= ures_getStringByIndex(fResource
, indexS
, &len
, &status
);
329 return UnicodeString(TRUE
, r
, len
);
332 ResourceBundle
ResourceBundle::get(const char* key
, UErrorCode
& status
) const {
335 ures_initStackObject(&r
);
336 ures_getByKey(fResource
, key
, &r
, &status
);
337 ResourceBundle
res(&r
, status
);
338 if (U_SUCCESS(status
)) {
344 ResourceBundle
ResourceBundle::getWithFallback(const char* key
, UErrorCode
& status
){
346 ures_initStackObject(&r
);
347 ures_getByKeyWithFallback(fResource
, key
, &r
, &status
);
348 ResourceBundle
res(&r
, status
);
349 if(U_SUCCESS(status
)){
354 UnicodeString
ResourceBundle::getStringEx(const char* key
, UErrorCode
& status
) const {
356 const UChar
* r
= ures_getStringByKey(fResource
, key
, &len
, &status
);
357 return UnicodeString(TRUE
, r
, len
);
361 ResourceBundle::getVersionNumber() const
363 return ures_getVersionNumber(fResource
);
366 void ResourceBundle::getVersion(UVersionInfo versionInfo
) const {
367 ures_getVersion(fResource
, versionInfo
);
370 const Locale
&ResourceBundle::getLocale(void) const
374 needInit
= (fLocale
== NULL
);
377 UErrorCode status
= U_ZERO_ERROR
;
378 const char *localeName
= ures_getLocale(fResource
, &status
);
379 Locale
*tLocale
= new Locale(localeName
);
381 ResourceBundle
*me
= (ResourceBundle
*)this; // semantically const
382 if (me
->fLocale
== NULL
) {
383 me
->fLocale
= tLocale
;
392 const Locale
ResourceBundle::getLocale(ULocDataLocaleType type
, UErrorCode
&status
) const
394 return ures_getLocaleByType(fResource
, type
, &status
);