]> git.saurik.com Git - apple/cf.git/blame_incremental - Parsing.subproj/CFXMLParser.h
CF-299.tar.gz
[apple/cf.git] / Parsing.subproj / CFXMLParser.h
... / ...
CommitLineData
1/*
2 * Copyright (c) 2003 Apple Computer, Inc. All rights reserved.
3 *
4 * @APPLE_LICENSE_HEADER_START@
5 *
6 * Copyright (c) 1999-2003 Apple Computer, Inc. All Rights Reserved.
7 *
8 * This file contains Original Code and/or Modifications of Original Code
9 * as defined in and that are subject to the Apple Public Source License
10 * Version 2.0 (the 'License'). You may not use this file except in
11 * compliance with the License. Please obtain a copy of the License at
12 * http://www.opensource.apple.com/apsl/ and read it before using this
13 * file.
14 *
15 * The Original Code and all software distributed under the License are
16 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
17 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
18 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
20 * Please see the License for the specific language governing rights and
21 * limitations under the License.
22 *
23 * @APPLE_LICENSE_HEADER_END@
24 */
25/* CFXMLParser.h
26 Copyright (c) 1998-2003, Apple, Inc. All rights reserved.
27*/
28
29#if !defined(__COREFOUNDATION_CFXMLPARSER__)
30#define __COREFOUNDATION_CFXMLPARSER__ 1
31
32#include <CoreFoundation/CFBase.h>
33#include <CoreFoundation/CFArray.h>
34#include <CoreFoundation/CFData.h>
35#include <CoreFoundation/CFDictionary.h>
36#include <CoreFoundation/CFTree.h>
37#include <CoreFoundation/CFURL.h>
38#include <CoreFoundation/CFXMLNode.h>
39
40#if defined(__cplusplus)
41extern "C" {
42#endif
43
/* Opaque reference to a parser object.  The underlying struct is not defined
   in this header, so clients only ever hold and pass around the pointer. */
typedef struct __CFXMLParser * CFXMLParserRef;
45
/* These are the various options you can configure the parser with.  These are
   chosen such that an option flag of 0 (kCFXMLParserNoOptions) leaves the XML
   as "intact" as possible (reports all structures; performs no replacements).
   Hence, to make the parser do the most work, returning only the pure element
   tree, set the option flag to kCFXMLParserAllOptions.

kCFXMLParserValidateDocument -
   validate the document against its grammar from the DTD, reporting any errors.
   Currently not supported.

kCFXMLParserSkipMetaData -
   silently skip over metadata constructs (the DTD and comments)

kCFXMLParserReplacePhysicalEntities -
   replace declared entities like &lt;.  Note that other than the 5 predefined
   entities (lt, gt, quot, amp, apos), these must be defined in the DTD.
   Currently not supported.

kCFXMLParserSkipWhitespace -
   skip over all whitespace that does not abut non-whitespace character data.
   In other words, given <foo>  <bar> blah </bar></foo>, the whitespace between
   foo's open tag and bar's open tag would be suppressed, but the whitespace
   around blah would be preserved.

kCFXMLParserResolveExternalEntities -
   not described by the original documentation.  NOTE(review): presumably
   controls whether referenced external entities are resolved (compare the
   resolveExternalEntity callback); confirm against the implementation.

kCFXMLParserAddImpliedAttributes -
   where the DTD specifies implied attribute-value pairs for a particular element,
   add those pairs to any occurrences of the element in the element tree.
   Currently not supported.
*/

typedef enum {
    kCFXMLParserValidateDocument = (1 << 0),
    kCFXMLParserSkipMetaData = (1 << 1),
    kCFXMLParserReplacePhysicalEntities = (1 << 2),
    kCFXMLParserSkipWhitespace = (1 << 3),
    kCFXMLParserResolveExternalEntities = (1 << 4),
    kCFXMLParserAddImpliedAttributes = (1 << 5),
    /* Low 24 bits set: covers every flag above plus bits not yet assigned. */
    kCFXMLParserAllOptions = 0x00FFFFFF,
    kCFXMLParserNoOptions = 0
} CFXMLParserOptions;
86
/* Status and error codes reported by the parser.  Negative values and zero
   describe the state of the parse; positive values are errors.

   This list is expected to grow.  The numeric values are spelled out so that
   adding a new code cannot silently renumber an existing one; append new
   codes at the end. */
typedef enum {
    kCFXMLStatusParseNotBegun = -2,
    kCFXMLStatusParseInProgress = -1,
    kCFXMLStatusParseSuccessful = 0,
    kCFXMLErrorUnexpectedEOF = 1,
    kCFXMLErrorUnknownEncoding = 2,
    kCFXMLErrorEncodingConversionFailure = 3,
    kCFXMLErrorMalformedProcessingInstruction = 4,
    kCFXMLErrorMalformedDTD = 5,
    kCFXMLErrorMalformedName = 6,
    kCFXMLErrorMalformedCDSect = 7,
    kCFXMLErrorMalformedCloseTag = 8,
    kCFXMLErrorMalformedStartTag = 9,
    kCFXMLErrorMalformedDocument = 10,
    kCFXMLErrorElementlessDocument = 11,
    kCFXMLErrorMalformedComment = 12,
    kCFXMLErrorMalformedCharacterReference = 13,
    kCFXMLErrorMalformedParsedCharacterData = 14,
    kCFXMLErrorNoData = 15
} CFXMLParserStatusCode;
108
109
110/* These functions are called as a parse progresses.
111
112createXMLStructure -
113 called as new XML structures are encountered by the parser. May return NULL to indicate
114 that the given structure should be skipped; if NULL is returned for a given structure,
115 only minimal parsing is done for that structure (enough to correctly determine its end,
116 and to extract any data necessary for the remainder of the parse, such as Entity definitions).
117 createXMLStructure (or indeed, any of the tree-creation callbacks) will not be called for any
118 children of the skipped structure. The only exception is that the top-most element will always
119 be reported even if NULL was returned for the document as a whole. NOTE: for performance reasons,
120 the node passed to createXMLStructure cannot be safely retained by the client; the node as
121 a whole must be copied (via CFXMLNodeCreateCopy), or its contents must be extracted and copied.
122
123addChild -
124 called as children are parsed and are ready to be added to the tree. If createXMLStructure
125 returns NULL for a given structure, that structure is omitted entirely, and addChild will
126 NOT be called for either a NULL child or parent.
127
128endXMLStructure -
129 called once a structure (and all its children) are completely parsed. As elements are encountered,
130 createXMLStructure is called for them first, then addChild to add the new structure to its parent,
131 then addChild (potentially several times) to add the new structure's children to it, then finally
132 endXMLStructure to show that the structure has been fully parsed.
133
134createXMLStructure, addChild, and endXMLStructure are all REQUIRED TO BE NON-NULL.
135
136resolveExternalEntity -
137 called when external entities are referenced (NOT when they are simply defined). If the function
138 pointer is NULL, the parser uses its internal routines to try and resolve the entity. If the
139 function pointer is set, and the function returns NULL, a place holder for the external entity
140 is inserted into the tree. In this manner, the parser's client can prevent any external network
141 or file accesses.
142
143handleError - called as errors/warnings are encountered in the data stream. At some point, we will
144 have an enum of the expected errors, some of which will be fatal, others of which will not. If
145 the function pointer is NULL, the parser will silently attempt to recover. The
146 handleError function may always return false to force the parser to stop; if handleError returns
147 true, the parser will attempt to recover (fatal errors will still cause the parse to abort
148 immediately).
149*/
150
151typedef void * (*CFXMLParserCreateXMLStructureCallBack)(CFXMLParserRef parser, CFXMLNodeRef nodeDesc, void *info);
152typedef void (*CFXMLParserAddChildCallBack)(CFXMLParserRef parser, void *parent, void *child, void *info);
153typedef void (*CFXMLParserEndXMLStructureCallBack)(CFXMLParserRef parser, void *xmlType, void *info);
154typedef CFDataRef (*CFXMLParserResolveExternalEntityCallBack)(CFXMLParserRef parser, CFXMLExternalID *extID, void *info);
155typedef Boolean (*CFXMLParserHandleErrorCallBack)(CFXMLParserRef parser, CFXMLParserStatusCode error, void *info);
156typedef struct {
157 CFIndex version;
158 CFXMLParserCreateXMLStructureCallBack createXMLStructure;
159 CFXMLParserAddChildCallBack addChild;
160 CFXMLParserEndXMLStructureCallBack endXMLStructure;
161 CFXMLParserResolveExternalEntityCallBack resolveExternalEntity;
162 CFXMLParserHandleErrorCallBack handleError;
163} CFXMLParserCallBacks;
164
165typedef const void * (*CFXMLParserRetainCallBack)(const void *info);
166typedef void (*CFXMLParserReleaseCallBack)(const void *info);
167typedef CFStringRef (*CFXMLParserCopyDescriptionCallBack)(const void *info);
168typedef struct {
169 CFIndex version;
170 void * info;
171 CFXMLParserRetainCallBack retain;
172 CFXMLParserReleaseCallBack release;
173 CFXMLParserCopyDescriptionCallBack copyDescription;
174} CFXMLParserContext;
175
176CF_EXPORT
177CFTypeID CFXMLParserGetTypeID(void);
178
179/* Creates a parser which will parse the given data with the given options. xmlData may not be NULL.
180 dataSource should be the URL from which the data came, and may be NULL; it is used to resolve any
181 relative references found in xmlData. versionOfNodes determines which version CFXMLNodes are produced
182 by the parser; see CFXMLNode.h for more details. callBacks are the callbacks called by the parser as
183 the parse progresses; callBacks, callBacks->createXMLStructure, callBacks->addChild, and
184 callBacks->endXMLStructure must all be non-NULL. context determines what if any info pointer is
185 passed to the callbacks as the parse progresses; context may be NULL. */
186CF_EXPORT
187CFXMLParserRef CFXMLParserCreate(CFAllocatorRef allocator, CFDataRef xmlData, CFURLRef dataSource, CFOptionFlags parseOptions, CFIndex versionOfNodes, CFXMLParserCallBacks *callBacks, CFXMLParserContext *context);
188
189
190CF_EXPORT
191void CFXMLParserGetContext(CFXMLParserRef parser, CFXMLParserContext *context);
192
193CF_EXPORT
194void CFXMLParserGetCallBacks(CFXMLParserRef parser, CFXMLParserCallBacks *callBacks);
195
196CF_EXPORT
197CFURLRef CFXMLParserGetSourceURL(CFXMLParserRef parser);
198
199/* Returns the character index of the current parse location */
200CF_EXPORT
201CFIndex CFXMLParserGetLocation(CFXMLParserRef parser);
202
203/* Returns the line number of the current parse location */
204CF_EXPORT
205CFIndex CFXMLParserGetLineNumber(CFXMLParserRef parser);
206
207/* Returns the top-most object returned by the createXMLStructure callback */
208CF_EXPORT
209void *CFXMLParserGetDocument(CFXMLParserRef parser);
210
211/* Get the status code or a user-readable description of the last error that occurred in a parse.
212 If no error has occurred, a null description string is returned. See the enum above for
213 possible status returns */
214CF_EXPORT
215CFXMLParserStatusCode CFXMLParserGetStatusCode(CFXMLParserRef parser);
216
217CF_EXPORT
218CFStringRef CFXMLParserCopyErrorDescription(CFXMLParserRef parser);
219
220/* Cause any in-progress parse to abort with the given error code and description. errorCode
221 must be positive, and errorDescription may not be NULL. Cannot be called asynchronously
222 (i.e. must be called from within a parser callback) */
223CF_EXPORT
224void CFXMLParserAbort(CFXMLParserRef parser, CFXMLParserStatusCode errorCode, CFStringRef errorDescription);
225
226/* Starts a parse of the data the parser was created with; returns success or failure.
227 Upon success, use CFXMLParserGetDocument() to get the product of the parse. Upon
228 failure, use CFXMLParserGetErrorCode() or CFXMLParserCopyErrorDescription() to get
229 information about the error. It is an error to call CFXMLParserParse() while a
230 parse is already underway. */
231CF_EXPORT
232Boolean CFXMLParserParse(CFXMLParserRef parser);
233
234/* These functions provide a higher-level interface. The XML data is parsed to a
235 special CFTree (an CFXMLTree) with known contexts and callbacks. See CFXMLNode.h
236 for full details on using an CFXMLTree and the CFXMLNodes contained therein.
237*/
238/* Parse to an CFXMLTreeRef. parseOptions are as above. versionOfNodes determines
239 what version CFXMLNodes are used to populate the tree. */
240CF_EXPORT
241CFXMLTreeRef CFXMLTreeCreateFromData(CFAllocatorRef allocator, CFDataRef xmlData, CFURLRef dataSource, CFOptionFlags parseOptions, CFIndex versionOfNodes);
242
243/* As above, with the additional by-reference pass of a CFDictionaryRef containing
244 various error information (see below). The caller is responsible for releasing the
245 returned dictionary. If the error dictionary is not desired, pass NULL. */
246CF_EXPORT
247CFXMLTreeRef CFXMLTreeCreateFromDataWithError(CFAllocatorRef allocator, CFDataRef xmlData, CFURLRef dataSource, CFOptionFlags parseOptions, CFIndex versionOfNodes, CFDictionaryRef *errorDict) AVAILABLE_MAC_OS_X_VERSION_10_3_AND_LATER;
248
249
250/* Generate the XMLData (ready to be written to whatever permanent storage is to be
251 used) from an CFXMLTree. Will NOT regenerate entity references (except those
252 required for syntactic correctness) if they were replaced at the parse time;
253 clients that wish this should walk the tree and re-insert any entity references
254 that should appear in the final output file. */
255CF_EXPORT
256CFDataRef CFXMLTreeCreateXMLData(CFAllocatorRef allocator, CFXMLTreeRef xmlTree);
257
258/* Escaping and unescaping XML entities in CFStrings. The standard XML entities
259 are always replaced. */
260/* Creates a CFString by replacing entities that appear in the entities dictionary.
261 Dictionary keys are the entities themselves, and the values should be CFStrings
262 containing the expansion. Pass NULL for entitiesDictionary to indicate no entities
263 other than the standard five. */
264CF_EXPORT
265CFStringRef CFXMLCreateStringByEscapingEntities(CFAllocatorRef allocator, CFStringRef string, CFDictionaryRef entitiesDictionary) AVAILABLE_MAC_OS_X_VERSION_10_3_AND_LATER;
266
267CF_EXPORT
268CFStringRef CFXMLCreateStringByUnescapingEntities(CFAllocatorRef allocator, CFStringRef string, CFDictionaryRef entitiesDictionary) AVAILABLE_MAC_OS_X_VERSION_10_3_AND_LATER;
269
270/* CFXMLTreeCreateFromDataWithError error dictionary key constants. */
271CF_EXPORT const CFStringRef kCFXMLTreeErrorDescription AVAILABLE_MAC_OS_X_VERSION_10_3_AND_LATER;
272 /* value is a CFString containing the readable error string. */
273
274CF_EXPORT const CFStringRef kCFXMLTreeErrorLineNumber AVAILABLE_MAC_OS_X_VERSION_10_3_AND_LATER;
275 /* value is a CFNumber containing the line on which the error appears. */
276
277CF_EXPORT const CFStringRef kCFXMLTreeErrorLocation AVAILABLE_MAC_OS_X_VERSION_10_3_AND_LATER;
278 /* value is a CFNumber containing the byte location at which the error occurred. */
279
280CF_EXPORT const CFStringRef kCFXMLTreeErrorStatusCode AVAILABLE_MAC_OS_X_VERSION_10_3_AND_LATER;
281 /* value is a CFNumber containing the error status code. */
282
283#if defined(__cplusplus)
284}
285#endif
286
287#endif /* ! __COREFOUNDATION_CFXMLPARSER__ */
288