1347
|
1 /*
|
|
2 The contents of this file are subject to the Mozilla Public License
|
|
3 Version 1.1 (the "License"); you may not use this file except in
|
|
4 compliance with the License. You may obtain a copy of the License at
|
|
5 http://www.mozilla.org/MPL/
|
|
6
|
|
7 Software distributed under the License is distributed on an "AS IS"
|
|
8 basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See the
|
|
9 License for the specific language governing rights and limitations
|
|
10 under the License.
|
|
11
|
|
12 The Original Code is expat.
|
|
13
|
|
14 The Initial Developer of the Original Code is James Clark.
|
|
15 Portions created by James Clark are Copyright (C) 1998, 1999
|
|
16 James Clark. All Rights Reserved.
|
|
17
|
|
18 Contributor(s):
|
|
19
|
|
20 Alternatively, the contents of this file may be used under the terms
|
|
21 of the GNU General Public License (the "GPL"), in which case the
|
|
22 provisions of the GPL are applicable instead of those above. If you
|
|
23 wish to allow use of your version of this file only under the terms of
|
|
24 the GPL and not to allow others to use your version of this file under
|
|
25 the MPL, indicate your decision by deleting the provisions above and
|
|
26 replace them with the notice and other provisions required by the
|
|
27 GPL. If you do not delete the provisions above, a recipient may use
|
|
28 your version of this file under either the MPL or the GPL.
|
|
29 */
|
|
30
|
|
31 #include "xmldef.h"
|
|
32 #include "xmlparse.h"
|
|
33
|
|
/* Select the internal character representation.  With XML_UNICODE
   defined the UTF-16 names are used and ICHAR is unsigned short;
   otherwise the UTF-8 names are used and ICHAR is char.
   MUST_CONVERT(enc, s) is nonzero when enc is not flagged as already
   being the internal encoding; the UTF-16 variant is also nonzero when
   the address s is odd. */
#ifdef XML_UNICODE
#define XML_ENCODE_MAX XML_UTF16_ENCODE_MAX
#define XmlConvert XmlUtf16Convert
#define XmlGetInternalEncoding XmlGetUtf16InternalEncoding
#define XmlGetInternalEncodingNS XmlGetUtf16InternalEncodingNS
#define XmlEncode XmlUtf16Encode
/* The argument s is parenthesised so that the cast applies to the whole
   argument expression rather than to its first operand only. */
#define MUST_CONVERT(enc, s) (!(enc)->isUtf16 || (((unsigned long)(s)) & 1))
typedef unsigned short ICHAR;
#else
#define XML_ENCODE_MAX XML_UTF8_ENCODE_MAX
#define XmlConvert XmlUtf8Convert
#define XmlGetInternalEncoding XmlGetUtf8InternalEncoding
#define XmlGetInternalEncodingNS XmlGetUtf8InternalEncodingNS
#define XmlEncode XmlUtf8Encode
#define MUST_CONVERT(enc, s) (!(enc)->isUtf8)
typedef char ICHAR;
#endif
|
|
51
|
|
52
|
|
/* When XML_NS is not defined, every NS-suffixed name is mapped onto its
   plain counterpart. */
#ifndef XML_NS

#define XmlInitEncodingNS XmlInitEncoding
#define XmlInitUnknownEncodingNS XmlInitUnknownEncoding
#define XmlParseXmlDeclNS XmlParseXmlDecl
/* XmlGetInternalEncodingNS was already defined above, so drop that
   definition before redirecting it. */
#undef XmlGetInternalEncodingNS
#define XmlGetInternalEncodingNS XmlGetInternalEncoding

#endif /* not XML_NS */
|
|
62
|
|
63
|
|
/* XML_T(x) wraps a character literal: it is left untouched unless
   XML_UNICODE_WCHAR_T is defined, in which case an L prefix is pasted
   onto it. */
#ifndef XML_UNICODE_WCHAR_T
#define XML_T(x) x
#else
#define XML_T(x) L ## x
#endif
|
|
69
|
|
/* ROUND_UP(n, sz): smallest multiple of sz that is not less than n.
   sz has to be a power of 2 because the result is obtained by masking. */
#define ROUND_UP(n, sz) (((n) + ((sz) - 1)) & ~((sz) - 1))
|
|
72
|
|
73 #include "xmltok.h"
|
|
74 #include "xmlrole.h"
|
|
75 #include "hashtable.h"
|
|
76
|
|
/* Initial sizes for the parser's growable buffers. */
#define INIT_TAG_BUF_SIZE 32  /* must be a multiple of sizeof(XML_Char) */
#define INIT_DATA_BUF_SIZE 1024  /* counted in XML_Char units by XML_ParserCreate */
#define INIT_ATTS_SIZE 16  /* counted in ATTRIBUTE entries by XML_ParserCreate */
#define INIT_BLOCK_SIZE 1024
#define INIT_BUFFER_SIZE 1024  /* starting point for XML_GetBuffer's doubling */

#define EXPAND_SPARE 24
|
|
84
|
|
85 typedef struct binding {
|
|
86 struct prefix *prefix;
|
|
87 struct binding *nextTagBinding;
|
|
88 struct binding *prevPrefixBinding;
|
|
89 const struct attribute_id *attId;
|
|
90 XML_Char *uri;
|
|
91 int uriLen;
|
|
92 int uriAlloc;
|
|
93 } BINDING;
|
|
94
|
|
95 typedef struct prefix {
|
|
96 const XML_Char *name;
|
|
97 BINDING *binding;
|
|
98 } PREFIX;
|
|
99
|
|
100 typedef struct {
|
|
101 const XML_Char *str;
|
|
102 const XML_Char *localPart;
|
|
103 int uriLen;
|
|
104 } TAG_NAME;
|
|
105
|
|
106 typedef struct tag {
|
|
107 struct tag *parent;
|
|
108 const char *rawName;
|
|
109 int rawNameLength;
|
|
110 TAG_NAME name;
|
|
111 char *buf;
|
|
112 char *bufEnd;
|
|
113 BINDING *bindings;
|
|
114 } TAG;
|
|
115
|
|
116 typedef struct {
|
|
117 const XML_Char *name;
|
|
118 const XML_Char *textPtr;
|
|
119 int textLen;
|
|
120 const XML_Char *systemId;
|
|
121 const XML_Char *base;
|
|
122 const XML_Char *publicId;
|
|
123 const XML_Char *notation;
|
|
124 char open;
|
|
125 } ENTITY;
|
|
126
|
|
127 typedef struct block {
|
|
128 struct block *next;
|
|
129 int size;
|
|
130 XML_Char s[1];
|
|
131 } BLOCK;
|
|
132
|
|
133 typedef struct {
|
|
134 BLOCK *blocks;
|
|
135 BLOCK *freeBlocks;
|
|
136 const XML_Char *end;
|
|
137 XML_Char *ptr;
|
|
138 XML_Char *start;
|
|
139 } STRING_POOL;
|
|
140
|
|
141 /* The XML_Char before the name is used to determine whether
|
|
142 an attribute has been specified. */
|
|
143 typedef struct attribute_id {
|
|
144 XML_Char *name;
|
|
145 PREFIX *prefix;
|
|
146 char maybeTokenized;
|
|
147 char xmlns;
|
|
148 } ATTRIBUTE_ID;
|
|
149
|
|
150 typedef struct {
|
|
151 const ATTRIBUTE_ID *id;
|
|
152 char isCdata;
|
|
153 const XML_Char *value;
|
|
154 } DEFAULT_ATTRIBUTE;
|
|
155
|
|
156 typedef struct {
|
|
157 const XML_Char *name;
|
|
158 PREFIX *prefix;
|
|
159 int nDefaultAtts;
|
|
160 int allocDefaultAtts;
|
|
161 DEFAULT_ATTRIBUTE *defaultAtts;
|
|
162 } ELEMENT_TYPE;
|
|
163
|
|
164 typedef struct {
|
|
165 HASH_TABLE generalEntities;
|
|
166 HASH_TABLE elementTypes;
|
|
167 HASH_TABLE attributeIds;
|
|
168 HASH_TABLE prefixes;
|
|
169 STRING_POOL pool;
|
|
170 int complete;
|
|
171 int standalone;
|
|
172 const XML_Char *base;
|
|
173 PREFIX defaultPrefix;
|
|
174 } DTD;
|
|
175
|
|
176 typedef struct open_internal_entity {
|
|
177 const char *internalEventPtr;
|
|
178 const char *internalEventEndPtr;
|
|
179 struct open_internal_entity *next;
|
|
180 ENTITY *entity;
|
|
181 } OPEN_INTERNAL_ENTITY;
|
|
182
|
|
183 typedef enum XML_Error Processor(XML_Parser parser,
|
|
184 const char *start,
|
|
185 const char *end,
|
|
186 const char **endPtr);
|
|
187
|
|
188 static Processor prologProcessor;
|
|
189 static Processor prologInitProcessor;
|
|
190 static Processor contentProcessor;
|
|
191 static Processor cdataSectionProcessor;
|
|
192 static Processor epilogProcessor;
|
|
193 static Processor errorProcessor;
|
|
194 static Processor externalEntityInitProcessor;
|
|
195 static Processor externalEntityInitProcessor2;
|
|
196 static Processor externalEntityInitProcessor3;
|
|
197 static Processor externalEntityContentProcessor;
|
|
198
|
|
199 static enum XML_Error
|
|
200 handleUnknownEncoding(XML_Parser parser, const XML_Char *encodingName);
|
|
201 static enum XML_Error
|
|
202 processXmlDecl(XML_Parser parser, int isGeneralTextEntity, const char *, const char *);
|
|
203 static enum XML_Error
|
|
204 initializeEncoding(XML_Parser parser);
|
|
205 static enum XML_Error
|
|
206 doContent(XML_Parser parser, int startTagLevel, const ENCODING *enc,
|
|
207 const char *start, const char *end, const char **endPtr);
|
|
208 static enum XML_Error
|
|
209 doCdataSection(XML_Parser parser, const ENCODING *, const char **startPtr, const char *end, const char **nextPtr);
|
|
210 static enum XML_Error storeAtts(XML_Parser parser, const ENCODING *, const char *s,
|
|
211 TAG_NAME *tagNamePtr, BINDING **bindingsPtr);
|
|
212 static
|
|
213 int addBinding(XML_Parser parser, PREFIX *prefix, const ATTRIBUTE_ID *attId, const XML_Char *uri, BINDING **bindingsPtr);
|
|
214 static int
|
|
215 defineAttribute(ELEMENT_TYPE *type, ATTRIBUTE_ID *, int isCdata, const XML_Char *dfltValue);
|
|
216 static enum XML_Error
|
|
217 storeAttributeValue(XML_Parser parser, const ENCODING *, int isCdata, const char *, const char *,
|
|
218 STRING_POOL *);
|
|
219 static enum XML_Error
|
|
220 appendAttributeValue(XML_Parser parser, const ENCODING *, int isCdata, const char *, const char *,
|
|
221 STRING_POOL *);
|
|
222 static ATTRIBUTE_ID *
|
|
223 getAttributeId(XML_Parser parser, const ENCODING *enc, const char *start, const char *end);
|
|
224 static int setElementTypePrefix(XML_Parser parser, ELEMENT_TYPE *);
|
|
225 static enum XML_Error
|
|
226 storeEntityValue(XML_Parser parser, const char *start, const char *end);
|
|
227 static int
|
|
228 reportProcessingInstruction(XML_Parser parser, const ENCODING *enc, const char *start, const char *end);
|
|
229 static int
|
|
230 reportComment(XML_Parser parser, const ENCODING *enc, const char *start, const char *end);
|
|
231 static void
|
|
232 reportDefault(XML_Parser parser, const ENCODING *enc, const char *start, const char *end);
|
|
233
|
|
234 static const XML_Char *getContext(XML_Parser parser);
|
|
235 static int setContext(XML_Parser parser, const XML_Char *context);
|
|
236 static void normalizePublicId(XML_Char *s);
|
|
237 static int dtdInit(DTD *);
|
|
238 static void dtdDestroy(DTD *);
|
|
239 static int dtdCopy(DTD *newDtd, const DTD *oldDtd);
|
|
240 static void poolInit(STRING_POOL *);
|
|
241 static void poolClear(STRING_POOL *);
|
|
242 static void poolDestroy(STRING_POOL *);
|
|
243 static XML_Char *poolAppend(STRING_POOL *pool, const ENCODING *enc,
|
|
244 const char *ptr, const char *end);
|
|
245 static XML_Char *poolStoreString(STRING_POOL *pool, const ENCODING *enc,
|
|
246 const char *ptr, const char *end);
|
|
247 static int poolGrow(STRING_POOL *pool);
|
|
248 static const XML_Char *poolCopyString(STRING_POOL *pool, const XML_Char *s);
|
|
249 static const XML_Char *poolCopyStringN(STRING_POOL *pool, const XML_Char *s, int n);
|
|
250
|
|
/* Accessors for a STRING_POOL.  Every macro takes a pointer to the pool;
   the argument is fully parenthesised in each expansion so that any
   pointer expression (for example &somePool) can be passed. */

/* Start of the string currently under construction. */
#define poolStart(pool) ((pool)->start)
/* One past the last character appended so far. */
#define poolEnd(pool) ((pool)->ptr)
/* Number of characters appended so far. */
#define poolLength(pool) ((pool)->ptr - (pool)->start)
/* Drop the last appended character. */
#define poolChop(pool) ((void)--((pool)->ptr))
/* The last appended character. */
#define poolLastChar(pool) (((pool)->ptr)[-1])
/* Throw away the string under construction. */
#define poolDiscard(pool) ((pool)->ptr = (pool)->start)
/* Keep the string under construction and begin a new one after it. */
#define poolFinish(pool) ((pool)->start = (pool)->ptr)
/* Append c, calling poolGrow first when the pool is full.
   Evaluates to 1 on success and to 0 when poolGrow fails.
   Note that pool is evaluated more than once. */
#define poolAppendChar(pool, c) \
  (((pool)->ptr == (pool)->end && !poolGrow(pool)) \
   ? 0 \
   : ((*((pool)->ptr)++ = (c)), 1))
|
|
262
|
|
263 typedef struct {
|
|
264 /* The first member must be userData so that the XML_GetUserData macro works. */
|
|
265 void *m_userData;
|
|
266 void *m_handlerArg;
|
|
267 char *m_buffer;
|
|
268 /* first character to be parsed */
|
|
269 const char *m_bufferPtr;
|
|
270 /* past last character to be parsed */
|
|
271 char *m_bufferEnd;
|
|
272 /* allocated end of buffer */
|
|
273 const char *m_bufferLim;
|
|
274 long m_parseEndByteIndex;
|
|
275 const char *m_parseEndPtr;
|
|
276 XML_Char *m_dataBuf;
|
|
277 XML_Char *m_dataBufEnd;
|
|
278 XML_StartElementHandler m_startElementHandler;
|
|
279 XML_EndElementHandler m_endElementHandler;
|
|
280 XML_CharacterDataHandler m_characterDataHandler;
|
|
281 XML_ProcessingInstructionHandler m_processingInstructionHandler;
|
|
282 XML_CommentHandler m_commentHandler;
|
|
283 XML_StartCdataSectionHandler m_startCdataSectionHandler;
|
|
284 XML_EndCdataSectionHandler m_endCdataSectionHandler;
|
|
285 XML_DefaultHandler m_defaultHandler;
|
|
286 XML_UnparsedEntityDeclHandler m_unparsedEntityDeclHandler;
|
|
287 XML_NotationDeclHandler m_notationDeclHandler;
|
|
288 XML_StartNamespaceDeclHandler m_startNamespaceDeclHandler;
|
|
289 XML_EndNamespaceDeclHandler m_endNamespaceDeclHandler;
|
|
290 XML_NotStandaloneHandler m_notStandaloneHandler;
|
|
291 XML_ExternalEntityRefHandler m_externalEntityRefHandler;
|
|
292 void *m_externalEntityRefHandlerArg;
|
|
293 XML_UnknownEncodingHandler m_unknownEncodingHandler;
|
|
294 const ENCODING *m_encoding;
|
|
295 INIT_ENCODING m_initEncoding;
|
|
296 const XML_Char *m_protocolEncodingName;
|
|
297 int m_ns;
|
|
298 void *m_unknownEncodingMem;
|
|
299 void *m_unknownEncodingData;
|
|
300 void *m_unknownEncodingHandlerData;
|
|
301 void (*m_unknownEncodingRelease)(void *);
|
|
302 PROLOG_STATE m_prologState;
|
|
303 Processor *m_processor;
|
|
304 enum XML_Error m_errorCode;
|
|
305 const char *m_eventPtr;
|
|
306 const char *m_eventEndPtr;
|
|
307 const char *m_positionPtr;
|
|
308 OPEN_INTERNAL_ENTITY *m_openInternalEntities;
|
|
309 int m_defaultExpandInternalEntities;
|
|
310 int m_tagLevel;
|
|
311 ENTITY *m_declEntity;
|
|
312 const XML_Char *m_declNotationName;
|
|
313 const XML_Char *m_declNotationPublicId;
|
|
314 ELEMENT_TYPE *m_declElementType;
|
|
315 ATTRIBUTE_ID *m_declAttributeId;
|
|
316 char m_declAttributeIsCdata;
|
|
317 DTD m_dtd;
|
|
318 TAG *m_tagStack;
|
|
319 TAG *m_freeTagList;
|
|
320 BINDING *m_inheritedBindings;
|
|
321 BINDING *m_freeBindingList;
|
|
322 int m_attsSize;
|
|
323 int m_nSpecifiedAtts;
|
|
324 ATTRIBUTE *m_atts;
|
|
325 POSITION m_position;
|
|
326 STRING_POOL m_tempPool;
|
|
327 STRING_POOL m_temp2Pool;
|
|
328 char *m_groupConnector;
|
|
329 unsigned m_groupSize;
|
|
330 int m_hadExternalDoctype;
|
|
331 XML_Char m_namespaceSeparator;
|
|
332 } Parser;
|
|
333
|
|
/* Shorthand names for the members of the Parser behind the variable
   `parser` that is in scope at the point of use.  Each name expands to
   (((Parser *)parser)->m_<name>). */
#define PARSER_FIELD(f) (((Parser *)parser)->f)

#define userData PARSER_FIELD(m_userData)
#define handlerArg PARSER_FIELD(m_handlerArg)
#define startElementHandler PARSER_FIELD(m_startElementHandler)
#define endElementHandler PARSER_FIELD(m_endElementHandler)
#define characterDataHandler PARSER_FIELD(m_characterDataHandler)
#define processingInstructionHandler PARSER_FIELD(m_processingInstructionHandler)
#define commentHandler PARSER_FIELD(m_commentHandler)
#define startCdataSectionHandler PARSER_FIELD(m_startCdataSectionHandler)
#define endCdataSectionHandler PARSER_FIELD(m_endCdataSectionHandler)
#define defaultHandler PARSER_FIELD(m_defaultHandler)
#define unparsedEntityDeclHandler PARSER_FIELD(m_unparsedEntityDeclHandler)
#define notationDeclHandler PARSER_FIELD(m_notationDeclHandler)
#define startNamespaceDeclHandler PARSER_FIELD(m_startNamespaceDeclHandler)
#define endNamespaceDeclHandler PARSER_FIELD(m_endNamespaceDeclHandler)
#define notStandaloneHandler PARSER_FIELD(m_notStandaloneHandler)
#define externalEntityRefHandler PARSER_FIELD(m_externalEntityRefHandler)
#define externalEntityRefHandlerArg PARSER_FIELD(m_externalEntityRefHandlerArg)
#define unknownEncodingHandler PARSER_FIELD(m_unknownEncodingHandler)
#define encoding PARSER_FIELD(m_encoding)
#define initEncoding PARSER_FIELD(m_initEncoding)
#define unknownEncodingMem PARSER_FIELD(m_unknownEncodingMem)
#define unknownEncodingData PARSER_FIELD(m_unknownEncodingData)
#define unknownEncodingHandlerData PARSER_FIELD(m_unknownEncodingHandlerData)
#define unknownEncodingRelease PARSER_FIELD(m_unknownEncodingRelease)
#define protocolEncodingName PARSER_FIELD(m_protocolEncodingName)
#define ns PARSER_FIELD(m_ns)
#define prologState PARSER_FIELD(m_prologState)
#define processor PARSER_FIELD(m_processor)
#define errorCode PARSER_FIELD(m_errorCode)
#define eventPtr PARSER_FIELD(m_eventPtr)
#define eventEndPtr PARSER_FIELD(m_eventEndPtr)
#define positionPtr PARSER_FIELD(m_positionPtr)
#define position PARSER_FIELD(m_position)
#define openInternalEntities PARSER_FIELD(m_openInternalEntities)
#define defaultExpandInternalEntities PARSER_FIELD(m_defaultExpandInternalEntities)
#define tagLevel PARSER_FIELD(m_tagLevel)
#define buffer PARSER_FIELD(m_buffer)
#define bufferPtr PARSER_FIELD(m_bufferPtr)
#define bufferEnd PARSER_FIELD(m_bufferEnd)
#define parseEndByteIndex PARSER_FIELD(m_parseEndByteIndex)
#define parseEndPtr PARSER_FIELD(m_parseEndPtr)
#define bufferLim PARSER_FIELD(m_bufferLim)
#define dataBuf PARSER_FIELD(m_dataBuf)
#define dataBufEnd PARSER_FIELD(m_dataBufEnd)
#define dtd PARSER_FIELD(m_dtd)
#define declEntity PARSER_FIELD(m_declEntity)
#define declNotationName PARSER_FIELD(m_declNotationName)
#define declNotationPublicId PARSER_FIELD(m_declNotationPublicId)
#define declElementType PARSER_FIELD(m_declElementType)
#define declAttributeId PARSER_FIELD(m_declAttributeId)
#define declAttributeIsCdata PARSER_FIELD(m_declAttributeIsCdata)
#define freeTagList PARSER_FIELD(m_freeTagList)
#define freeBindingList PARSER_FIELD(m_freeBindingList)
#define inheritedBindings PARSER_FIELD(m_inheritedBindings)
#define tagStack PARSER_FIELD(m_tagStack)
#define atts PARSER_FIELD(m_atts)
#define attsSize PARSER_FIELD(m_attsSize)
#define nSpecifiedAtts PARSER_FIELD(m_nSpecifiedAtts)
#define tempPool PARSER_FIELD(m_tempPool)
#define temp2Pool PARSER_FIELD(m_temp2Pool)
#define groupConnector PARSER_FIELD(m_groupConnector)
#define groupSize PARSER_FIELD(m_groupSize)
#define hadExternalDoctype PARSER_FIELD(m_hadExternalDoctype)
#define namespaceSeparator PARSER_FIELD(m_namespaceSeparator)
|
|
399
|
|
#if defined(_MSC_VER) && defined(_DEBUG)
/* Compiled only when both _MSC_VER and _DEBUG are defined: returns the
   handle typed as Parser *.
   NOTE(review): presumably a convenience for inspecting the parser in a
   debugger -- confirm. */
Parser *asParser(XML_Parser parser)
{
  return parser;
}
#endif /* _MSC_VER && _DEBUG */
|
|
408
|
|
409 XML_Parser XML_ParserCreate(const XML_Char *encodingName)
|
|
410 {
|
|
411 XML_Parser parser = malloc(sizeof(Parser));
|
|
412 if (!parser)
|
|
413 return parser;
|
|
414 processor = prologInitProcessor;
|
|
415 XmlPrologStateInit(&prologState);
|
|
416 userData = 0;
|
|
417 handlerArg = 0;
|
|
418 startElementHandler = 0;
|
|
419 endElementHandler = 0;
|
|
420 characterDataHandler = 0;
|
|
421 processingInstructionHandler = 0;
|
|
422 commentHandler = 0;
|
|
423 startCdataSectionHandler = 0;
|
|
424 endCdataSectionHandler = 0;
|
|
425 defaultHandler = 0;
|
|
426 unparsedEntityDeclHandler = 0;
|
|
427 notationDeclHandler = 0;
|
|
428 startNamespaceDeclHandler = 0;
|
|
429 endNamespaceDeclHandler = 0;
|
|
430 notStandaloneHandler = 0;
|
|
431 externalEntityRefHandler = 0;
|
|
432 externalEntityRefHandlerArg = parser;
|
|
433 unknownEncodingHandler = 0;
|
|
434 buffer = 0;
|
|
435 bufferPtr = 0;
|
|
436 bufferEnd = 0;
|
|
437 parseEndByteIndex = 0;
|
|
438 parseEndPtr = 0;
|
|
439 bufferLim = 0;
|
|
440 declElementType = 0;
|
|
441 declAttributeId = 0;
|
|
442 declEntity = 0;
|
|
443 declNotationName = 0;
|
|
444 declNotationPublicId = 0;
|
|
445 memset(&position, 0, sizeof(POSITION));
|
|
446 errorCode = XML_ERROR_NONE;
|
|
447 eventPtr = 0;
|
|
448 eventEndPtr = 0;
|
|
449 positionPtr = 0;
|
|
450 openInternalEntities = 0;
|
|
451 tagLevel = 0;
|
|
452 tagStack = 0;
|
|
453 freeTagList = 0;
|
|
454 freeBindingList = 0;
|
|
455 inheritedBindings = 0;
|
|
456 attsSize = INIT_ATTS_SIZE;
|
|
457 atts = malloc(attsSize * sizeof(ATTRIBUTE));
|
|
458 nSpecifiedAtts = 0;
|
|
459 dataBuf = malloc(INIT_DATA_BUF_SIZE * sizeof(XML_Char));
|
|
460 groupSize = 0;
|
|
461 groupConnector = 0;
|
|
462 hadExternalDoctype = 0;
|
|
463 unknownEncodingMem = 0;
|
|
464 unknownEncodingRelease = 0;
|
|
465 unknownEncodingData = 0;
|
|
466 unknownEncodingHandlerData = 0;
|
|
467 namespaceSeparator = '!';
|
|
468 ns = 0;
|
|
469 poolInit(&tempPool);
|
|
470 poolInit(&temp2Pool);
|
|
471 protocolEncodingName = encodingName ? poolCopyString(&tempPool, encodingName) : 0;
|
|
472 if (!dtdInit(&dtd) || !atts || !dataBuf
|
|
473 || (encodingName && !protocolEncodingName)) {
|
|
474 XML_ParserFree(parser);
|
|
475 return 0;
|
|
476 }
|
|
477 dataBufEnd = dataBuf + INIT_DATA_BUF_SIZE;
|
|
478 XmlInitEncoding(&initEncoding, &encoding, 0);
|
|
479 return parser;
|
|
480 }
|
|
481
|
|
482 XML_Parser XML_ParserCreateNS(const XML_Char *encodingName, XML_Char nsSep)
|
|
483 {
|
|
484 static
|
|
485 const XML_Char implicitContext[] = {
|
|
486 XML_T('x'), XML_T('m'), XML_T('l'), XML_T('='),
|
|
487 XML_T('h'), XML_T('t'), XML_T('t'), XML_T('p'), XML_T(':'),
|
|
488 XML_T('/'), XML_T('/'), XML_T('w'), XML_T('w'), XML_T('w'),
|
|
489 XML_T('.'), XML_T('w'), XML_T('3'),
|
|
490 XML_T('.'), XML_T('o'), XML_T('r'), XML_T('g'),
|
|
491 XML_T('/'), XML_T('X'), XML_T('M'), XML_T('L'),
|
|
492 XML_T('/'), XML_T('1'), XML_T('9'), XML_T('9'), XML_T('8'),
|
|
493 XML_T('/'), XML_T('n'), XML_T('a'), XML_T('m'), XML_T('e'),
|
|
494 XML_T('s'), XML_T('p'), XML_T('a'), XML_T('c'), XML_T('e'),
|
|
495 XML_T('\0')
|
|
496 };
|
|
497
|
|
498 XML_Parser parser = XML_ParserCreate(encodingName);
|
|
499 if (parser) {
|
|
500 XmlInitEncodingNS(&initEncoding, &encoding, 0);
|
|
501 ns = 1;
|
|
502 namespaceSeparator = nsSep;
|
|
503 }
|
|
504 if (!setContext(parser, implicitContext)) {
|
|
505 XML_ParserFree(parser);
|
|
506 return 0;
|
|
507 }
|
|
508 return parser;
|
|
509 }
|
|
510
|
|
511 int XML_SetEncoding(XML_Parser parser, const XML_Char *encodingName)
|
|
512 {
|
|
513 if (!encodingName)
|
|
514 protocolEncodingName = 0;
|
|
515 else {
|
|
516 protocolEncodingName = poolCopyString(&tempPool, encodingName);
|
|
517 if (!protocolEncodingName)
|
|
518 return 0;
|
|
519 }
|
|
520 return 1;
|
|
521 }
|
|
522
|
|
523 XML_Parser XML_ExternalEntityParserCreate(XML_Parser oldParser,
|
|
524 const XML_Char *context,
|
|
525 const XML_Char *encodingName)
|
|
526 {
|
|
527 XML_Parser parser = oldParser;
|
|
528 DTD *oldDtd = &dtd;
|
|
529 XML_StartElementHandler oldStartElementHandler = startElementHandler;
|
|
530 XML_EndElementHandler oldEndElementHandler = endElementHandler;
|
|
531 XML_CharacterDataHandler oldCharacterDataHandler = characterDataHandler;
|
|
532 XML_ProcessingInstructionHandler oldProcessingInstructionHandler = processingInstructionHandler;
|
|
533 XML_CommentHandler oldCommentHandler = commentHandler;
|
|
534 XML_StartCdataSectionHandler oldStartCdataSectionHandler = startCdataSectionHandler;
|
|
535 XML_EndCdataSectionHandler oldEndCdataSectionHandler = endCdataSectionHandler;
|
|
536 XML_DefaultHandler oldDefaultHandler = defaultHandler;
|
|
537 XML_StartNamespaceDeclHandler oldStartNamespaceDeclHandler = startNamespaceDeclHandler;
|
|
538 XML_EndNamespaceDeclHandler oldEndNamespaceDeclHandler = endNamespaceDeclHandler;
|
|
539 XML_NotStandaloneHandler oldNotStandaloneHandler = notStandaloneHandler;
|
|
540 XML_ExternalEntityRefHandler oldExternalEntityRefHandler = externalEntityRefHandler;
|
|
541 XML_UnknownEncodingHandler oldUnknownEncodingHandler = unknownEncodingHandler;
|
|
542 void *oldUserData = userData;
|
|
543 void *oldHandlerArg = handlerArg;
|
|
544 int oldDefaultExpandInternalEntities = defaultExpandInternalEntities;
|
|
545 void *oldExternalEntityRefHandlerArg = externalEntityRefHandlerArg;
|
|
546
|
|
547 parser = (ns
|
|
548 ? XML_ParserCreateNS(encodingName, namespaceSeparator)
|
|
549 : XML_ParserCreate(encodingName));
|
|
550 if (!parser)
|
|
551 return 0;
|
|
552 startElementHandler = oldStartElementHandler;
|
|
553 endElementHandler = oldEndElementHandler;
|
|
554 characterDataHandler = oldCharacterDataHandler;
|
|
555 processingInstructionHandler = oldProcessingInstructionHandler;
|
|
556 commentHandler = oldCommentHandler;
|
|
557 startCdataSectionHandler = oldStartCdataSectionHandler;
|
|
558 endCdataSectionHandler = oldEndCdataSectionHandler;
|
|
559 defaultHandler = oldDefaultHandler;
|
|
560 startNamespaceDeclHandler = oldStartNamespaceDeclHandler;
|
|
561 endNamespaceDeclHandler = oldEndNamespaceDeclHandler;
|
|
562 notStandaloneHandler = oldNotStandaloneHandler;
|
|
563 externalEntityRefHandler = oldExternalEntityRefHandler;
|
|
564 unknownEncodingHandler = oldUnknownEncodingHandler;
|
|
565 userData = oldUserData;
|
|
566 if (oldUserData == oldHandlerArg)
|
|
567 handlerArg = userData;
|
|
568 else
|
|
569 handlerArg = parser;
|
|
570 if (oldExternalEntityRefHandlerArg != oldParser)
|
|
571 externalEntityRefHandlerArg = oldExternalEntityRefHandlerArg;
|
|
572 defaultExpandInternalEntities = oldDefaultExpandInternalEntities;
|
|
573 if (!dtdCopy(&dtd, oldDtd) || !setContext(parser, context)) {
|
|
574 XML_ParserFree(parser);
|
|
575 return 0;
|
|
576 }
|
|
577 processor = externalEntityInitProcessor;
|
|
578 return parser;
|
|
579 }
|
|
580
|
|
581 static
|
|
582 void destroyBindings(BINDING *bindings)
|
|
583 {
|
|
584 for (;;) {
|
|
585 BINDING *b = bindings;
|
|
586 if (!b)
|
|
587 break;
|
|
588 bindings = b->nextTagBinding;
|
|
589 free(b->uri);
|
|
590 free(b);
|
|
591 }
|
|
592 }
|
|
593
|
|
594 void XML_ParserFree(XML_Parser parser)
|
|
595 {
|
|
596 for (;;) {
|
|
597 TAG *p;
|
|
598 if (tagStack == 0) {
|
|
599 if (freeTagList == 0)
|
|
600 break;
|
|
601 tagStack = freeTagList;
|
|
602 freeTagList = 0;
|
|
603 }
|
|
604 p = tagStack;
|
|
605 tagStack = tagStack->parent;
|
|
606 free(p->buf);
|
|
607 destroyBindings(p->bindings);
|
|
608 free(p);
|
|
609 }
|
|
610 destroyBindings(freeBindingList);
|
|
611 destroyBindings(inheritedBindings);
|
|
612 poolDestroy(&tempPool);
|
|
613 poolDestroy(&temp2Pool);
|
|
614 dtdDestroy(&dtd);
|
|
615 free((void *)atts);
|
|
616 free(groupConnector);
|
|
617 free(buffer);
|
|
618 free(dataBuf);
|
|
619 free(unknownEncodingMem);
|
|
620 if (unknownEncodingRelease)
|
|
621 unknownEncodingRelease(unknownEncodingData);
|
|
622 free(parser);
|
|
623 }
|
|
624
|
|
625 void XML_UseParserAsHandlerArg(XML_Parser parser)
|
|
626 {
|
|
627 handlerArg = parser;
|
|
628 }
|
|
629
|
|
630 void XML_SetUserData(XML_Parser parser, void *p)
|
|
631 {
|
|
632 if (handlerArg == userData)
|
|
633 handlerArg = userData = p;
|
|
634 else
|
|
635 userData = p;
|
|
636 }
|
|
637
|
|
638 int XML_SetBase(XML_Parser parser, const XML_Char *p)
|
|
639 {
|
|
640 if (p) {
|
|
641 p = poolCopyString(&dtd.pool, p);
|
|
642 if (!p)
|
|
643 return 0;
|
|
644 dtd.base = p;
|
|
645 }
|
|
646 else
|
|
647 dtd.base = 0;
|
|
648 return 1;
|
|
649 }
|
|
650
|
|
651 const XML_Char *XML_GetBase(XML_Parser parser)
|
|
652 {
|
|
653 return dtd.base;
|
|
654 }
|
|
655
|
|
656 int XML_GetSpecifiedAttributeCount(XML_Parser parser)
|
|
657 {
|
|
658 return nSpecifiedAtts;
|
|
659 }
|
|
660
|
|
661 void XML_SetElementHandler(XML_Parser parser,
|
|
662 XML_StartElementHandler start,
|
|
663 XML_EndElementHandler end)
|
|
664 {
|
|
665 startElementHandler = start;
|
|
666 endElementHandler = end;
|
|
667 }
|
|
668
|
|
669 void XML_SetCharacterDataHandler(XML_Parser parser,
|
|
670 XML_CharacterDataHandler handler)
|
|
671 {
|
|
672 characterDataHandler = handler;
|
|
673 }
|
|
674
|
|
675 void XML_SetProcessingInstructionHandler(XML_Parser parser,
|
|
676 XML_ProcessingInstructionHandler handler)
|
|
677 {
|
|
678 processingInstructionHandler = handler;
|
|
679 }
|
|
680
|
|
681 void XML_SetCommentHandler(XML_Parser parser,
|
|
682 XML_CommentHandler handler)
|
|
683 {
|
|
684 commentHandler = handler;
|
|
685 }
|
|
686
|
|
687 void XML_SetCdataSectionHandler(XML_Parser parser,
|
|
688 XML_StartCdataSectionHandler start,
|
|
689 XML_EndCdataSectionHandler end)
|
|
690 {
|
|
691 startCdataSectionHandler = start;
|
|
692 endCdataSectionHandler = end;
|
|
693 }
|
|
694
|
|
695 void XML_SetDefaultHandler(XML_Parser parser,
|
|
696 XML_DefaultHandler handler)
|
|
697 {
|
|
698 defaultHandler = handler;
|
|
699 defaultExpandInternalEntities = 0;
|
|
700 }
|
|
701
|
|
702 void XML_SetDefaultHandlerExpand(XML_Parser parser,
|
|
703 XML_DefaultHandler handler)
|
|
704 {
|
|
705 defaultHandler = handler;
|
|
706 defaultExpandInternalEntities = 1;
|
|
707 }
|
|
708
|
|
709 void XML_SetUnparsedEntityDeclHandler(XML_Parser parser,
|
|
710 XML_UnparsedEntityDeclHandler handler)
|
|
711 {
|
|
712 unparsedEntityDeclHandler = handler;
|
|
713 }
|
|
714
|
|
715 void XML_SetNotationDeclHandler(XML_Parser parser,
|
|
716 XML_NotationDeclHandler handler)
|
|
717 {
|
|
718 notationDeclHandler = handler;
|
|
719 }
|
|
720
|
|
721 void XML_SetNamespaceDeclHandler(XML_Parser parser,
|
|
722 XML_StartNamespaceDeclHandler start,
|
|
723 XML_EndNamespaceDeclHandler end)
|
|
724 {
|
|
725 startNamespaceDeclHandler = start;
|
|
726 endNamespaceDeclHandler = end;
|
|
727 }
|
|
728
|
|
729 void XML_SetNotStandaloneHandler(XML_Parser parser,
|
|
730 XML_NotStandaloneHandler handler)
|
|
731 {
|
|
732 notStandaloneHandler = handler;
|
|
733 }
|
|
734
|
|
735 void XML_SetExternalEntityRefHandler(XML_Parser parser,
|
|
736 XML_ExternalEntityRefHandler handler)
|
|
737 {
|
|
738 externalEntityRefHandler = handler;
|
|
739 }
|
|
740
|
|
741 void XML_SetExternalEntityRefHandlerArg(XML_Parser parser, void *arg)
|
|
742 {
|
|
743 if (arg)
|
|
744 externalEntityRefHandlerArg = arg;
|
|
745 else
|
|
746 externalEntityRefHandlerArg = parser;
|
|
747 }
|
|
748
|
|
749 void XML_SetUnknownEncodingHandler(XML_Parser parser,
|
|
750 XML_UnknownEncodingHandler handler,
|
|
751 void *data)
|
|
752 {
|
|
753 unknownEncodingHandler = handler;
|
|
754 unknownEncodingHandlerData = data;
|
|
755 }
|
|
756
|
|
757 int XML_Parse(XML_Parser parser, const char *s, int len, int isFinal)
|
|
758 {
|
|
759 if (len == 0) {
|
|
760 if (!isFinal)
|
|
761 return 1;
|
|
762 positionPtr = bufferPtr;
|
|
763 errorCode = processor(parser, bufferPtr, parseEndPtr = bufferEnd, 0);
|
|
764 if (errorCode == XML_ERROR_NONE)
|
|
765 return 1;
|
|
766 eventEndPtr = eventPtr;
|
|
767 return 0;
|
|
768 }
|
|
769 else if (bufferPtr == bufferEnd) {
|
|
770 const char *end;
|
|
771 int nLeftOver;
|
|
772 parseEndByteIndex += len;
|
|
773 positionPtr = s;
|
|
774 if (isFinal) {
|
|
775 errorCode = processor(parser, s, parseEndPtr = s + len, 0);
|
|
776 if (errorCode == XML_ERROR_NONE)
|
|
777 return 1;
|
|
778 eventEndPtr = eventPtr;
|
|
779 return 0;
|
|
780 }
|
|
781 errorCode = processor(parser, s, parseEndPtr = s + len, &end);
|
|
782 if (errorCode != XML_ERROR_NONE) {
|
|
783 eventEndPtr = eventPtr;
|
|
784 return 0;
|
|
785 }
|
|
786 XmlUpdatePosition(encoding, positionPtr, end, &position);
|
|
787 nLeftOver = s + len - end;
|
|
788 if (nLeftOver) {
|
|
789 if (buffer == 0 || nLeftOver > bufferLim - buffer) {
|
|
790 /* FIXME avoid integer overflow */
|
|
791 buffer = buffer == 0 ? malloc(len * 2) : realloc(buffer, len * 2);
|
|
792 if (!buffer) {
|
|
793 errorCode = XML_ERROR_NO_MEMORY;
|
|
794 eventPtr = eventEndPtr = 0;
|
|
795 return 0;
|
|
796 }
|
|
797 bufferLim = buffer + len * 2;
|
|
798 }
|
|
799 memcpy(buffer, end, nLeftOver);
|
|
800 bufferPtr = buffer;
|
|
801 bufferEnd = buffer + nLeftOver;
|
|
802 }
|
|
803 return 1;
|
|
804 }
|
|
805 else {
|
|
806 memcpy(XML_GetBuffer(parser, len), s, len);
|
|
807 return XML_ParseBuffer(parser, len, isFinal);
|
|
808 }
|
|
809 }
|
|
810
|
|
811 int XML_ParseBuffer(XML_Parser parser, int len, int isFinal)
|
|
812 {
|
|
813 const char *start = bufferPtr;
|
|
814 positionPtr = start;
|
|
815 bufferEnd += len;
|
|
816 parseEndByteIndex += len;
|
|
817 errorCode = processor(parser, start, parseEndPtr = bufferEnd,
|
|
818 isFinal ? (const char **)0 : &bufferPtr);
|
|
819 if (errorCode == XML_ERROR_NONE) {
|
|
820 if (!isFinal)
|
|
821 XmlUpdatePosition(encoding, positionPtr, bufferPtr, &position);
|
|
822 return 1;
|
|
823 }
|
|
824 else {
|
|
825 eventEndPtr = eventPtr;
|
|
826 return 0;
|
|
827 }
|
|
828 }
|
|
829
|
|
830 void *XML_GetBuffer(XML_Parser parser, int len)
|
|
831 {
|
|
832 if (len > bufferLim - bufferEnd) {
|
|
833 /* FIXME avoid integer overflow */
|
|
834 int neededSize = len + (bufferEnd - bufferPtr);
|
|
835 if (neededSize <= bufferLim - buffer) {
|
|
836 memmove(buffer, bufferPtr, bufferEnd - bufferPtr);
|
|
837 bufferEnd = buffer + (bufferEnd - bufferPtr);
|
|
838 bufferPtr = buffer;
|
|
839 }
|
|
840 else {
|
|
841 char *newBuf;
|
|
842 int bufferSize = bufferLim - bufferPtr;
|
|
843 if (bufferSize == 0)
|
|
844 bufferSize = INIT_BUFFER_SIZE;
|
|
845 do {
|
|
846 bufferSize *= 2;
|
|
847 } while (bufferSize < neededSize);
|
|
848 newBuf = malloc(bufferSize);
|
|
849 if (newBuf == 0) {
|
|
850 errorCode = XML_ERROR_NO_MEMORY;
|
|
851 return 0;
|
|
852 }
|
|
853 bufferLim = newBuf + bufferSize;
|
|
854 if (bufferPtr) {
|
|
855 memcpy(newBuf, bufferPtr, bufferEnd - bufferPtr);
|
|
856 free(buffer);
|
|
857 }
|
|
858 bufferEnd = newBuf + (bufferEnd - bufferPtr);
|
|
859 bufferPtr = buffer = newBuf;
|
|
860 }
|
|
861 }
|
|
862 return bufferEnd;
|
|
863 }
|
|
864
|
|
865 enum XML_Error XML_GetErrorCode(XML_Parser parser)
|
|
866 {
|
|
867 return errorCode;
|
|
868 }
|
|
869
|
|
870 long XML_GetCurrentByteIndex(XML_Parser parser)
|
|
871 {
|
|
872 if (eventPtr)
|
|
873 return parseEndByteIndex - (parseEndPtr - eventPtr);
|
|
874 return -1;
|
|
875 }
|
|
876
|
|
877 int XML_GetCurrentByteCount(XML_Parser parser)
|
|
878 {
|
|
879 if (eventEndPtr && eventPtr)
|
|
880 return eventEndPtr - eventPtr;
|
|
881 return 0;
|
|
882 }
|
|
883
|
|
884 int XML_GetCurrentLineNumber(XML_Parser parser)
|
|
885 {
|
|
886 if (eventPtr) {
|
|
887 XmlUpdatePosition(encoding, positionPtr, eventPtr, &position);
|
|
888 positionPtr = eventPtr;
|
|
889 }
|
|
890 return position.lineNumber + 1;
|
|
891 }
|
|
892
|
|
893 int XML_GetCurrentColumnNumber(XML_Parser parser)
|
|
894 {
|
|
895 if (eventPtr) {
|
|
896 XmlUpdatePosition(encoding, positionPtr, eventPtr, &position);
|
|
897 positionPtr = eventPtr;
|
|
898 }
|
|
899 return position.columnNumber;
|
|
900 }
|
|
901
|
|
902 void XML_DefaultCurrent(XML_Parser parser)
|
|
903 {
|
|
904 if (defaultHandler) {
|
|
905 if (openInternalEntities)
|
|
906 reportDefault(parser,
|
|
907 ns ? XmlGetInternalEncodingNS() : XmlGetInternalEncoding(),
|
|
908 openInternalEntities->internalEventPtr,
|
|
909 openInternalEntities->internalEventEndPtr);
|
|
910 else
|
|
911 reportDefault(parser, encoding, eventPtr, eventEndPtr);
|
|
912 }
|
|
913 }
|
|
914
|
|
915 const XML_LChar *XML_ErrorString(int code)
|
|
916 {
|
|
917 static const XML_LChar *message[] = {
|
|
918 0,
|
|
919 XML_T("out of memory"),
|
|
920 XML_T("syntax error"),
|
|
921 XML_T("no element found"),
|
|
922 XML_T("not well-formed"),
|
|
923 XML_T("unclosed token"),
|
|
924 XML_T("unclosed token"),
|
|
925 XML_T("mismatched tag"),
|
|
926 XML_T("duplicate attribute"),
|
|
927 XML_T("junk after document element"),
|
|
928 XML_T("illegal parameter entity reference"),
|
|
929 XML_T("undefined entity"),
|
|
930 XML_T("recursive entity reference"),
|
|
931 XML_T("asynchronous entity"),
|
|
932 XML_T("reference to invalid character number"),
|
|
933 XML_T("reference to binary entity"),
|
|
934 XML_T("reference to external entity in attribute"),
|
|
935 XML_T("xml processing instruction not at start of external entity"),
|
|
936 XML_T("unknown encoding"),
|
|
937 XML_T("encoding specified in XML declaration is incorrect"),
|
|
938 XML_T("unclosed CDATA section"),
|
|
939 XML_T("error in processing external entity reference"),
|
|
940 XML_T("document is not standalone")
|
|
941 };
|
|
942 if (code > 0 && code < sizeof(message)/sizeof(message[0]))
|
|
943 return message[code];
|
|
944 return 0;
|
|
945 }
|
|
946
|
|
947 static
|
|
948 enum XML_Error contentProcessor(XML_Parser parser,
|
|
949 const char *start,
|
|
950 const char *end,
|
|
951 const char **endPtr)
|
|
952 {
|
|
953 return doContent(parser, 0, encoding, start, end, endPtr);
|
|
954 }
|
|
955
|
|
956 static
|
|
957 enum XML_Error externalEntityInitProcessor(XML_Parser parser,
|
|
958 const char *start,
|
|
959 const char *end,
|
|
960 const char **endPtr)
|
|
961 {
|
|
962 enum XML_Error result = initializeEncoding(parser);
|
|
963 if (result != XML_ERROR_NONE)
|
|
964 return result;
|
|
965 processor = externalEntityInitProcessor2;
|
|
966 return externalEntityInitProcessor2(parser, start, end, endPtr);
|
|
967 }
|
|
968
|
|
969 static
|
|
970 enum XML_Error externalEntityInitProcessor2(XML_Parser parser,
|
|
971 const char *start,
|
|
972 const char *end,
|
|
973 const char **endPtr)
|
|
974 {
|
|
975 const char *next;
|
|
976 int tok = XmlContentTok(encoding, start, end, &next);
|
|
977 switch (tok) {
|
|
978 case XML_TOK_BOM:
|
|
979 start = next;
|
|
980 break;
|
|
981 case XML_TOK_PARTIAL:
|
|
982 if (endPtr) {
|
|
983 *endPtr = start;
|
|
984 return XML_ERROR_NONE;
|
|
985 }
|
|
986 eventPtr = start;
|
|
987 return XML_ERROR_UNCLOSED_TOKEN;
|
|
988 case XML_TOK_PARTIAL_CHAR:
|
|
989 if (endPtr) {
|
|
990 *endPtr = start;
|
|
991 return XML_ERROR_NONE;
|
|
992 }
|
|
993 eventPtr = start;
|
|
994 return XML_ERROR_PARTIAL_CHAR;
|
|
995 }
|
|
996 processor = externalEntityInitProcessor3;
|
|
997 return externalEntityInitProcessor3(parser, start, end, endPtr);
|
|
998 }
|
|
999
|
|
1000 static
|
|
1001 enum XML_Error externalEntityInitProcessor3(XML_Parser parser,
|
|
1002 const char *start,
|
|
1003 const char *end,
|
|
1004 const char **endPtr)
|
|
1005 {
|
|
1006 const char *next;
|
|
1007 int tok = XmlContentTok(encoding, start, end, &next);
|
|
1008 switch (tok) {
|
|
1009 case XML_TOK_XML_DECL:
|
|
1010 {
|
|
1011 enum XML_Error result = processXmlDecl(parser, 1, start, next);
|
|
1012 if (result != XML_ERROR_NONE)
|
|
1013 return result;
|
|
1014 start = next;
|
|
1015 }
|
|
1016 break;
|
|
1017 case XML_TOK_PARTIAL:
|
|
1018 if (endPtr) {
|
|
1019 *endPtr = start;
|
|
1020 return XML_ERROR_NONE;
|
|
1021 }
|
|
1022 eventPtr = start;
|
|
1023 return XML_ERROR_UNCLOSED_TOKEN;
|
|
1024 case XML_TOK_PARTIAL_CHAR:
|
|
1025 if (endPtr) {
|
|
1026 *endPtr = start;
|
|
1027 return XML_ERROR_NONE;
|
|
1028 }
|
|
1029 eventPtr = start;
|
|
1030 return XML_ERROR_PARTIAL_CHAR;
|
|
1031 }
|
|
1032 processor = externalEntityContentProcessor;
|
|
1033 tagLevel = 1;
|
|
1034 return doContent(parser, 1, encoding, start, end, endPtr);
|
|
1035 }
|
|
1036
|
|
1037 static
|
|
1038 enum XML_Error externalEntityContentProcessor(XML_Parser parser,
|
|
1039 const char *start,
|
|
1040 const char *end,
|
|
1041 const char **endPtr)
|
|
1042 {
|
|
1043 return doContent(parser, 1, encoding, start, end, endPtr);
|
|
1044 }
|
|
1045
|
|
1046 static enum XML_Error
|
|
1047 doContent(XML_Parser parser,
|
|
1048 int startTagLevel,
|
|
1049 const ENCODING *enc,
|
|
1050 const char *s,
|
|
1051 const char *end,
|
|
1052 const char **nextPtr)
|
|
1053 {
|
|
1054 const ENCODING *internalEnc = ns ? XmlGetInternalEncodingNS() : XmlGetInternalEncoding();
|
|
1055 const char **eventPP;
|
|
1056 const char **eventEndPP;
|
|
1057 if (enc == encoding) {
|
|
1058 eventPP = &eventPtr;
|
|
1059 eventEndPP = &eventEndPtr;
|
|
1060 }
|
|
1061 else {
|
|
1062 eventPP = &(openInternalEntities->internalEventPtr);
|
|
1063 eventEndPP = &(openInternalEntities->internalEventEndPtr);
|
|
1064 }
|
|
1065 *eventPP = s;
|
|
1066 for (;;) {
|
|
1067 const char *next = s; /* XmlContentTok doesn't always set the last arg */
|
|
1068 int tok = XmlContentTok(enc, s, end, &next);
|
|
1069 *eventEndPP = next;
|
|
1070 switch (tok) {
|
|
1071 case XML_TOK_TRAILING_CR:
|
|
1072 if (nextPtr) {
|
|
1073 *nextPtr = s;
|
|
1074 return XML_ERROR_NONE;
|
|
1075 }
|
|
1076 *eventEndPP = end;
|
|
1077 if (characterDataHandler) {
|
|
1078 XML_Char c = 0xA;
|
|
1079 characterDataHandler(handlerArg, &c, 1);
|
|
1080 }
|
|
1081 else if (defaultHandler)
|
|
1082 reportDefault(parser, enc, s, end);
|
|
1083 if (startTagLevel == 0)
|
|
1084 return XML_ERROR_NO_ELEMENTS;
|
|
1085 if (tagLevel != startTagLevel)
|
|
1086 return XML_ERROR_ASYNC_ENTITY;
|
|
1087 return XML_ERROR_NONE;
|
|
1088 case XML_TOK_NONE:
|
|
1089 if (nextPtr) {
|
|
1090 *nextPtr = s;
|
|
1091 return XML_ERROR_NONE;
|
|
1092 }
|
|
1093 if (startTagLevel > 0) {
|
|
1094 if (tagLevel != startTagLevel)
|
|
1095 return XML_ERROR_ASYNC_ENTITY;
|
|
1096 return XML_ERROR_NONE;
|
|
1097 }
|
|
1098 return XML_ERROR_NO_ELEMENTS;
|
|
1099 case XML_TOK_INVALID:
|
|
1100 *eventPP = next;
|
|
1101 return XML_ERROR_INVALID_TOKEN;
|
|
1102 case XML_TOK_PARTIAL:
|
|
1103 if (nextPtr) {
|
|
1104 *nextPtr = s;
|
|
1105 return XML_ERROR_NONE;
|
|
1106 }
|
|
1107 return XML_ERROR_UNCLOSED_TOKEN;
|
|
1108 case XML_TOK_PARTIAL_CHAR:
|
|
1109 if (nextPtr) {
|
|
1110 *nextPtr = s;
|
|
1111 return XML_ERROR_NONE;
|
|
1112 }
|
|
1113 return XML_ERROR_PARTIAL_CHAR;
|
|
1114 case XML_TOK_ENTITY_REF:
|
|
1115 {
|
|
1116 const XML_Char *name;
|
|
1117 ENTITY *entity;
|
|
1118 XML_Char ch = XmlPredefinedEntityName(enc,
|
|
1119 s + enc->minBytesPerChar,
|
|
1120 next - enc->minBytesPerChar);
|
|
1121 if (ch) {
|
|
1122 if (characterDataHandler)
|
|
1123 characterDataHandler(handlerArg, &ch, 1);
|
|
1124 else if (defaultHandler)
|
|
1125 reportDefault(parser, enc, s, next);
|
|
1126 break;
|
|
1127 }
|
|
1128 name = poolStoreString(&dtd.pool, enc,
|
|
1129 s + enc->minBytesPerChar,
|
|
1130 next - enc->minBytesPerChar);
|
|
1131 if (!name)
|
|
1132 return XML_ERROR_NO_MEMORY;
|
|
1133 entity = (ENTITY *)lookup(&dtd.generalEntities, name, 0);
|
|
1134 poolDiscard(&dtd.pool);
|
|
1135 if (!entity) {
|
|
1136 if (dtd.complete || dtd.standalone)
|
|
1137 return XML_ERROR_UNDEFINED_ENTITY;
|
|
1138 if (defaultHandler)
|
|
1139 reportDefault(parser, enc, s, next);
|
|
1140 break;
|
|
1141 }
|
|
1142 if (entity->open)
|
|
1143 return XML_ERROR_RECURSIVE_ENTITY_REF;
|
|
1144 if (entity->notation)
|
|
1145 return XML_ERROR_BINARY_ENTITY_REF;
|
|
1146 if (entity) {
|
|
1147 if (entity->textPtr) {
|
|
1148 enum XML_Error result;
|
|
1149 OPEN_INTERNAL_ENTITY openEntity;
|
|
1150 if (defaultHandler && !defaultExpandInternalEntities) {
|
|
1151 reportDefault(parser, enc, s, next);
|
|
1152 break;
|
|
1153 }
|
|
1154 entity->open = 1;
|
|
1155 openEntity.next = openInternalEntities;
|
|
1156 openInternalEntities = &openEntity;
|
|
1157 openEntity.entity = entity;
|
|
1158 openEntity.internalEventPtr = 0;
|
|
1159 openEntity.internalEventEndPtr = 0;
|
|
1160 result = doContent(parser,
|
|
1161 tagLevel,
|
|
1162 internalEnc,
|
|
1163 (char *)entity->textPtr,
|
|
1164 (char *)(entity->textPtr + entity->textLen),
|
|
1165 0);
|
|
1166 entity->open = 0;
|
|
1167 openInternalEntities = openEntity.next;
|
|
1168 if (result)
|
|
1169 return result;
|
|
1170 }
|
|
1171 else if (externalEntityRefHandler) {
|
|
1172 const XML_Char *context;
|
|
1173 entity->open = 1;
|
|
1174 context = getContext(parser);
|
|
1175 entity->open = 0;
|
|
1176 if (!context)
|
|
1177 return XML_ERROR_NO_MEMORY;
|
|
1178 if (!externalEntityRefHandler(externalEntityRefHandlerArg,
|
|
1179 context,
|
|
1180 dtd.base,
|
|
1181 entity->systemId,
|
|
1182 entity->publicId))
|
|
1183 return XML_ERROR_EXTERNAL_ENTITY_HANDLING;
|
|
1184 poolDiscard(&tempPool);
|
|
1185 }
|
|
1186 else if (defaultHandler)
|
|
1187 reportDefault(parser, enc, s, next);
|
|
1188 }
|
|
1189 break;
|
|
1190 }
|
|
1191 case XML_TOK_START_TAG_WITH_ATTS:
|
|
1192 if (!startElementHandler) {
|
|
1193 enum XML_Error result = storeAtts(parser, enc, s, 0, 0);
|
|
1194 if (result)
|
|
1195 return result;
|
|
1196 }
|
|
1197 /* fall through */
|
|
1198 case XML_TOK_START_TAG_NO_ATTS:
|
|
1199 {
|
|
1200 TAG *tag;
|
|
1201 if (freeTagList) {
|
|
1202 tag = freeTagList;
|
|
1203 freeTagList = freeTagList->parent;
|
|
1204 }
|
|
1205 else {
|
|
1206 tag = malloc(sizeof(TAG));
|
|
1207 if (!tag)
|
|
1208 return XML_ERROR_NO_MEMORY;
|
|
1209 tag->buf = malloc(INIT_TAG_BUF_SIZE);
|
|
1210 if (!tag->buf)
|
|
1211 return XML_ERROR_NO_MEMORY;
|
|
1212 tag->bufEnd = tag->buf + INIT_TAG_BUF_SIZE;
|
|
1213 }
|
|
1214 tag->bindings = 0;
|
|
1215 tag->parent = tagStack;
|
|
1216 tagStack = tag;
|
|
1217 tag->name.localPart = 0;
|
|
1218 tag->rawName = s + enc->minBytesPerChar;
|
|
1219 tag->rawNameLength = XmlNameLength(enc, tag->rawName);
|
|
1220 if (nextPtr) {
|
|
1221 /* Need to guarantee that:
|
|
1222 tag->buf + ROUND_UP(tag->rawNameLength, sizeof(XML_Char)) <= tag->bufEnd - sizeof(XML_Char) */
|
|
1223 if (tag->rawNameLength + (int)(sizeof(XML_Char) - 1) + (int)sizeof(XML_Char) > tag->bufEnd - tag->buf) {
|
|
1224 int bufSize = tag->rawNameLength * 4;
|
|
1225 bufSize = ROUND_UP(bufSize, sizeof(XML_Char));
|
|
1226 tag->buf = realloc(tag->buf, bufSize);
|
|
1227 if (!tag->buf)
|
|
1228 return XML_ERROR_NO_MEMORY;
|
|
1229 tag->bufEnd = tag->buf + bufSize;
|
|
1230 }
|
|
1231 memcpy(tag->buf, tag->rawName, tag->rawNameLength);
|
|
1232 tag->rawName = tag->buf;
|
|
1233 }
|
|
1234 ++tagLevel;
|
|
1235 if (startElementHandler) {
|
|
1236 enum XML_Error result;
|
|
1237 XML_Char *toPtr;
|
|
1238 for (;;) {
|
|
1239 const char *rawNameEnd = tag->rawName + tag->rawNameLength;
|
|
1240 const char *fromPtr = tag->rawName;
|
|
1241 int bufSize;
|
|
1242 if (nextPtr)
|
|
1243 toPtr = (XML_Char *)(tag->buf + ROUND_UP(tag->rawNameLength, sizeof(XML_Char)));
|
|
1244 else
|
|
1245 toPtr = (XML_Char *)tag->buf;
|
|
1246 tag->name.str = toPtr;
|
|
1247 XmlConvert(enc,
|
|
1248 &fromPtr, rawNameEnd,
|
|
1249 (ICHAR **)&toPtr, (ICHAR *)tag->bufEnd - 1);
|
|
1250 if (fromPtr == rawNameEnd)
|
|
1251 break;
|
|
1252 bufSize = (tag->bufEnd - tag->buf) << 1;
|
|
1253 tag->buf = realloc(tag->buf, bufSize);
|
|
1254 if (!tag->buf)
|
|
1255 return XML_ERROR_NO_MEMORY;
|
|
1256 tag->bufEnd = tag->buf + bufSize;
|
|
1257 if (nextPtr)
|
|
1258 tag->rawName = tag->buf;
|
|
1259 }
|
|
1260 *toPtr = XML_T('\0');
|
|
1261 result = storeAtts(parser, enc, s, &(tag->name), &(tag->bindings));
|
|
1262 if (result)
|
|
1263 return result;
|
|
1264 startElementHandler(handlerArg, tag->name.str, (const XML_Char **)atts);
|
|
1265 poolClear(&tempPool);
|
|
1266 }
|
|
1267 else {
|
|
1268 tag->name.str = 0;
|
|
1269 if (defaultHandler)
|
|
1270 reportDefault(parser, enc, s, next);
|
|
1271 }
|
|
1272 break;
|
|
1273 }
|
|
1274 case XML_TOK_EMPTY_ELEMENT_WITH_ATTS:
|
|
1275 if (!startElementHandler) {
|
|
1276 enum XML_Error result = storeAtts(parser, enc, s, 0, 0);
|
|
1277 if (result)
|
|
1278 return result;
|
|
1279 }
|
|
1280 /* fall through */
|
|
1281 case XML_TOK_EMPTY_ELEMENT_NO_ATTS:
|
|
1282 if (startElementHandler || endElementHandler) {
|
|
1283 const char *rawName = s + enc->minBytesPerChar;
|
|
1284 enum XML_Error result;
|
|
1285 BINDING *bindings = 0;
|
|
1286 TAG_NAME name;
|
|
1287 name.str = poolStoreString(&tempPool, enc, rawName,
|
|
1288 rawName + XmlNameLength(enc, rawName));
|
|
1289 if (!name.str)
|
|
1290 return XML_ERROR_NO_MEMORY;
|
|
1291 poolFinish(&tempPool);
|
|
1292 result = storeAtts(parser, enc, s, &name, &bindings);
|
|
1293 if (result)
|
|
1294 return result;
|
|
1295 poolFinish(&tempPool);
|
|
1296 if (startElementHandler)
|
|
1297 startElementHandler(handlerArg, name.str, (const XML_Char **)atts);
|
|
1298 if (endElementHandler) {
|
|
1299 if (startElementHandler)
|
|
1300 *eventPP = *eventEndPP;
|
|
1301 endElementHandler(handlerArg, name.str);
|
|
1302 }
|
|
1303 poolClear(&tempPool);
|
|
1304 while (bindings) {
|
|
1305 BINDING *b = bindings;
|
|
1306 if (endNamespaceDeclHandler)
|
|
1307 endNamespaceDeclHandler(handlerArg, b->prefix->name);
|
|
1308 bindings = bindings->nextTagBinding;
|
|
1309 b->nextTagBinding = freeBindingList;
|
|
1310 freeBindingList = b;
|
|
1311 b->prefix->binding = b->prevPrefixBinding;
|
|
1312 }
|
|
1313 }
|
|
1314 else if (defaultHandler)
|
|
1315 reportDefault(parser, enc, s, next);
|
|
1316 if (tagLevel == 0)
|
|
1317 return epilogProcessor(parser, next, end, nextPtr);
|
|
1318 break;
|
|
1319 case XML_TOK_END_TAG:
|
|
1320 if (tagLevel == startTagLevel)
|
|
1321 return XML_ERROR_ASYNC_ENTITY;
|
|
1322 else {
|
|
1323 int len;
|
|
1324 const char *rawName;
|
|
1325 TAG *tag = tagStack;
|
|
1326 tagStack = tag->parent;
|
|
1327 tag->parent = freeTagList;
|
|
1328 freeTagList = tag;
|
|
1329 rawName = s + enc->minBytesPerChar*2;
|
|
1330 len = XmlNameLength(enc, rawName);
|
|
1331 if (len != tag->rawNameLength
|
|
1332 || memcmp(tag->rawName, rawName, len) != 0) {
|
|
1333 *eventPP = rawName;
|
|
1334 return XML_ERROR_TAG_MISMATCH;
|
|
1335 }
|
|
1336 --tagLevel;
|
|
1337 if (endElementHandler && tag->name.str) {
|
|
1338 if (tag->name.localPart) {
|
|
1339 XML_Char *to = (XML_Char *)tag->name.str + tag->name.uriLen;
|
|
1340 const XML_Char *from = tag->name.localPart;
|
|
1341 while ((*to++ = *from++) != 0)
|
|
1342 ;
|
|
1343 }
|
|
1344 endElementHandler(handlerArg, tag->name.str);
|
|
1345 }
|
|
1346 else if (defaultHandler)
|
|
1347 reportDefault(parser, enc, s, next);
|
|
1348 while (tag->bindings) {
|
|
1349 BINDING *b = tag->bindings;
|
|
1350 if (endNamespaceDeclHandler)
|
|
1351 endNamespaceDeclHandler(handlerArg, b->prefix->name);
|
|
1352 tag->bindings = tag->bindings->nextTagBinding;
|
|
1353 b->nextTagBinding = freeBindingList;
|
|
1354 freeBindingList = b;
|
|
1355 b->prefix->binding = b->prevPrefixBinding;
|
|
1356 }
|
|
1357 if (tagLevel == 0)
|
|
1358 return epilogProcessor(parser, next, end, nextPtr);
|
|
1359 }
|
|
1360 break;
|
|
1361 case XML_TOK_CHAR_REF:
|
|
1362 {
|
|
1363 int n = XmlCharRefNumber(enc, s);
|
|
1364 if (n < 0)
|
|
1365 return XML_ERROR_BAD_CHAR_REF;
|
|
1366 if (characterDataHandler) {
|
|
1367 XML_Char buf[XML_ENCODE_MAX];
|
|
1368 characterDataHandler(handlerArg, buf, XmlEncode(n, (ICHAR *)buf));
|
|
1369 }
|
|
1370 else if (defaultHandler)
|
|
1371 reportDefault(parser, enc, s, next);
|
|
1372 }
|
|
1373 break;
|
|
1374 case XML_TOK_XML_DECL:
|
|
1375 return XML_ERROR_MISPLACED_XML_PI;
|
|
1376 case XML_TOK_DATA_NEWLINE:
|
|
1377 if (characterDataHandler) {
|
|
1378 XML_Char c = 0xA;
|
|
1379 characterDataHandler(handlerArg, &c, 1);
|
|
1380 }
|
|
1381 else if (defaultHandler)
|
|
1382 reportDefault(parser, enc, s, next);
|
|
1383 break;
|
|
1384 case XML_TOK_CDATA_SECT_OPEN:
|
|
1385 {
|
|
1386 enum XML_Error result;
|
|
1387 if (startCdataSectionHandler)
|
|
1388 startCdataSectionHandler(handlerArg);
|
|
1389 #if 0
|
|
1390 /* Suppose you doing a transformation on a document that involves
|
|
1391 changing only the character data. You set up a defaultHandler
|
|
1392 and a characterDataHandler. The defaultHandler simply copies
|
|
1393 characters through. The characterDataHandler does the transformation
|
|
1394 and writes the characters out escaping them as necessary. This case
|
|
1395 will fail to work if we leave out the following two lines (because &
|
|
1396 and < inside CDATA sections will be incorrectly escaped).
|
|
1397
|
|
1398 However, now we have a start/endCdataSectionHandler, so it seems
|
|
1399 easier to let the user deal with this. */
|
|
1400
|
|
1401 else if (characterDataHandler)
|
|
1402 characterDataHandler(handlerArg, dataBuf, 0);
|
|
1403 #endif
|
|
1404 else if (defaultHandler)
|
|
1405 reportDefault(parser, enc, s, next);
|
|
1406 result = doCdataSection(parser, enc, &next, end, nextPtr);
|
|
1407 if (!next) {
|
|
1408 processor = cdataSectionProcessor;
|
|
1409 return result;
|
|
1410 }
|
|
1411 }
|
|
1412 break;
|
|
1413 case XML_TOK_TRAILING_RSQB:
|
|
1414 if (nextPtr) {
|
|
1415 *nextPtr = s;
|
|
1416 return XML_ERROR_NONE;
|
|
1417 }
|
|
1418 if (characterDataHandler) {
|
|
1419 if (MUST_CONVERT(enc, s)) {
|
|
1420 ICHAR *dataPtr = (ICHAR *)dataBuf;
|
|
1421 XmlConvert(enc, &s, end, &dataPtr, (ICHAR *)dataBufEnd);
|
|
1422 characterDataHandler(handlerArg, dataBuf, dataPtr - (ICHAR *)dataBuf);
|
|
1423 }
|
|
1424 else
|
|
1425 characterDataHandler(handlerArg,
|
|
1426 (XML_Char *)s,
|
|
1427 (XML_Char *)end - (XML_Char *)s);
|
|
1428 }
|
|
1429 else if (defaultHandler)
|
|
1430 reportDefault(parser, enc, s, end);
|
|
1431 if (startTagLevel == 0) {
|
|
1432 *eventPP = end;
|
|
1433 return XML_ERROR_NO_ELEMENTS;
|
|
1434 }
|
|
1435 if (tagLevel != startTagLevel) {
|
|
1436 *eventPP = end;
|
|
1437 return XML_ERROR_ASYNC_ENTITY;
|
|
1438 }
|
|
1439 return XML_ERROR_NONE;
|
|
1440 case XML_TOK_DATA_CHARS:
|
|
1441 if (characterDataHandler) {
|
|
1442 if (MUST_CONVERT(enc, s)) {
|
|
1443 for (;;) {
|
|
1444 ICHAR *dataPtr = (ICHAR *)dataBuf;
|
|
1445 XmlConvert(enc, &s, next, &dataPtr, (ICHAR *)dataBufEnd);
|
|
1446 *eventEndPP = s;
|
|
1447 characterDataHandler(handlerArg, dataBuf, dataPtr - (ICHAR *)dataBuf);
|
|
1448 if (s == next)
|
|
1449 break;
|
|
1450 *eventPP = s;
|
|
1451 }
|
|
1452 }
|
|
1453 else
|
|
1454 characterDataHandler(handlerArg,
|
|
1455 (XML_Char *)s,
|
|
1456 (XML_Char *)next - (XML_Char *)s);
|
|
1457 }
|
|
1458 else if (defaultHandler)
|
|
1459 reportDefault(parser, enc, s, next);
|
|
1460 break;
|
|
1461 case XML_TOK_PI:
|
|
1462 if (!reportProcessingInstruction(parser, enc, s, next))
|
|
1463 return XML_ERROR_NO_MEMORY;
|
|
1464 break;
|
|
1465 case XML_TOK_COMMENT:
|
|
1466 if (!reportComment(parser, enc, s, next))
|
|
1467 return XML_ERROR_NO_MEMORY;
|
|
1468 break;
|
|
1469 default:
|
|
1470 if (defaultHandler)
|
|
1471 reportDefault(parser, enc, s, next);
|
|
1472 break;
|
|
1473 }
|
|
1474 *eventPP = s = next;
|
|
1475 }
|
|
1476 /* not reached */
|
|
1477 }
|
|
1478
|
|
1479 /* If tagNamePtr is non-null, build a real list of attributes,
|
|
1480 otherwise just check the attributes for well-formedness. */
|
|
1481
|
|
1482 static enum XML_Error storeAtts(XML_Parser parser, const ENCODING *enc,
|
|
1483 const char *s, TAG_NAME *tagNamePtr,
|
|
1484 BINDING **bindingsPtr)
|
|
1485 {
|
|
1486 ELEMENT_TYPE *elementType = 0;
|
|
1487 int nDefaultAtts = 0;
|
|
1488 const XML_Char **appAtts;
|
|
1489 int attIndex = 0;
|
|
1490 int i;
|
|
1491 int n;
|
|
1492 int nPrefixes = 0;
|
|
1493 BINDING *binding;
|
|
1494 const XML_Char *localPart;
|
|
1495
|
|
1496 if (tagNamePtr) {
|
|
1497 elementType = (ELEMENT_TYPE *)lookup(&dtd.elementTypes, tagNamePtr->str, 0);
|
|
1498 if (!elementType) {
|
|
1499 tagNamePtr->str = poolCopyString(&dtd.pool, tagNamePtr->str);
|
|
1500 if (!tagNamePtr->str)
|
|
1501 return XML_ERROR_NO_MEMORY;
|
|
1502 elementType = (ELEMENT_TYPE *)lookup(&dtd.elementTypes, tagNamePtr->str, sizeof(ELEMENT_TYPE));
|
|
1503 if (!elementType)
|
|
1504 return XML_ERROR_NO_MEMORY;
|
|
1505 if (ns && !setElementTypePrefix(parser, elementType))
|
|
1506 return XML_ERROR_NO_MEMORY;
|
|
1507 }
|
|
1508 nDefaultAtts = elementType->nDefaultAtts;
|
|
1509 }
|
|
1510 n = XmlGetAttributes(enc, s, attsSize, atts);
|
|
1511 if (n + nDefaultAtts > attsSize) {
|
|
1512 int oldAttsSize = attsSize;
|
|
1513 attsSize = n + nDefaultAtts + INIT_ATTS_SIZE;
|
|
1514 atts = realloc((void *)atts, attsSize * sizeof(ATTRIBUTE));
|
|
1515 if (!atts)
|
|
1516 return XML_ERROR_NO_MEMORY;
|
|
1517 if (n > oldAttsSize)
|
|
1518 XmlGetAttributes(enc, s, n, atts);
|
|
1519 }
|
|
1520 appAtts = (const XML_Char **)atts;
|
|
1521 for (i = 0; i < n; i++) {
|
|
1522 ATTRIBUTE_ID *attId = getAttributeId(parser, enc, atts[i].name,
|
|
1523 atts[i].name
|
|
1524 + XmlNameLength(enc, atts[i].name));
|
|
1525 if (!attId)
|
|
1526 return XML_ERROR_NO_MEMORY;
|
|
1527 if ((attId->name)[-1]) {
|
|
1528 if (enc == encoding)
|
|
1529 eventPtr = atts[i].name;
|
|
1530 return XML_ERROR_DUPLICATE_ATTRIBUTE;
|
|
1531 }
|
|
1532 (attId->name)[-1] = 1;
|
|
1533 appAtts[attIndex++] = attId->name;
|
|
1534 if (!atts[i].normalized) {
|
|
1535 enum XML_Error result;
|
|
1536 int isCdata = 1;
|
|
1537
|
|
1538 if (attId->maybeTokenized) {
|
|
1539 int j;
|
|
1540 for (j = 0; j < nDefaultAtts; j++) {
|
|
1541 if (attId == elementType->defaultAtts[j].id) {
|
|
1542 isCdata = elementType->defaultAtts[j].isCdata;
|
|
1543 break;
|
|
1544 }
|
|
1545 }
|
|
1546 }
|
|
1547
|
|
1548 result = storeAttributeValue(parser, enc, isCdata,
|
|
1549 atts[i].valuePtr, atts[i].valueEnd,
|
|
1550 &tempPool);
|
|
1551 if (result)
|
|
1552 return result;
|
|
1553 if (tagNamePtr) {
|
|
1554 appAtts[attIndex] = poolStart(&tempPool);
|
|
1555 poolFinish(&tempPool);
|
|
1556 }
|
|
1557 else
|
|
1558 poolDiscard(&tempPool);
|
|
1559 }
|
|
1560 else if (tagNamePtr) {
|
|
1561 appAtts[attIndex] = poolStoreString(&tempPool, enc, atts[i].valuePtr, atts[i].valueEnd);
|
|
1562 if (appAtts[attIndex] == 0)
|
|
1563 return XML_ERROR_NO_MEMORY;
|
|
1564 poolFinish(&tempPool);
|
|
1565 }
|
|
1566 if (attId->prefix && tagNamePtr) {
|
|
1567 if (attId->xmlns) {
|
|
1568 if (!addBinding(parser, attId->prefix, attId, appAtts[attIndex], bindingsPtr))
|
|
1569 return XML_ERROR_NO_MEMORY;
|
|
1570 --attIndex;
|
|
1571 }
|
|
1572 else {
|
|
1573 attIndex++;
|
|
1574 nPrefixes++;
|
|
1575 (attId->name)[-1] = 2;
|
|
1576 }
|
|
1577 }
|
|
1578 else
|
|
1579 attIndex++;
|
|
1580 }
|
|
1581 nSpecifiedAtts = attIndex;
|
|
1582 if (tagNamePtr) {
|
|
1583 int j;
|
|
1584 for (j = 0; j < nDefaultAtts; j++) {
|
|
1585 const DEFAULT_ATTRIBUTE *da = elementType->defaultAtts + j;
|
|
1586 if (!(da->id->name)[-1] && da->value) {
|
|
1587 if (da->id->prefix) {
|
|
1588 if (da->id->xmlns) {
|
|
1589 if (!addBinding(parser, da->id->prefix, da->id, da->value, bindingsPtr))
|
|
1590 return XML_ERROR_NO_MEMORY;
|
|
1591 }
|
|
1592 else {
|
|
1593 (da->id->name)[-1] = 2;
|
|
1594 nPrefixes++;
|
|
1595 appAtts[attIndex++] = da->id->name;
|
|
1596 appAtts[attIndex++] = da->value;
|
|
1597 }
|
|
1598 }
|
|
1599 else {
|
|
1600 (da->id->name)[-1] = 1;
|
|
1601 appAtts[attIndex++] = da->id->name;
|
|
1602 appAtts[attIndex++] = da->value;
|
|
1603 }
|
|
1604 }
|
|
1605 }
|
|
1606 appAtts[attIndex] = 0;
|
|
1607 }
|
|
1608 i = 0;
|
|
1609 if (nPrefixes) {
|
|
1610 for (; i < attIndex; i += 2) {
|
|
1611 if (appAtts[i][-1] == 2) {
|
|
1612 ATTRIBUTE_ID *id;
|
|
1613 ((XML_Char *)(appAtts[i]))[-1] = 0;
|
|
1614 id = (ATTRIBUTE_ID *)lookup(&dtd.attributeIds, appAtts[i], 0);
|
|
1615 if (id->prefix->binding) {
|
|
1616 int j;
|
|
1617 const BINDING *b = id->prefix->binding;
|
|
1618 const XML_Char *s = appAtts[i];
|
|
1619 for (j = 0; j < b->uriLen; j++) {
|
|
1620 if (!poolAppendChar(&tempPool, b->uri[j]))
|
|
1621 return XML_ERROR_NO_MEMORY;
|
|
1622 }
|
|
1623 while (*s++ != ':')
|
|
1624 ;
|
|
1625 do {
|
|
1626 if (!poolAppendChar(&tempPool, *s))
|
|
1627 return XML_ERROR_NO_MEMORY;
|
|
1628 } while (*s++);
|
|
1629 appAtts[i] = poolStart(&tempPool);
|
|
1630 poolFinish(&tempPool);
|
|
1631 }
|
|
1632 if (!--nPrefixes)
|
|
1633 break;
|
|
1634 }
|
|
1635 else
|
|
1636 ((XML_Char *)(appAtts[i]))[-1] = 0;
|
|
1637 }
|
|
1638 }
|
|
1639 for (; i < attIndex; i += 2)
|
|
1640 ((XML_Char *)(appAtts[i]))[-1] = 0;
|
|
1641 if (!tagNamePtr)
|
|
1642 return XML_ERROR_NONE;
|
|
1643 for (binding = *bindingsPtr; binding; binding = binding->nextTagBinding)
|
|
1644 binding->attId->name[-1] = 0;
|
|
1645 if (elementType->prefix) {
|
|
1646 binding = elementType->prefix->binding;
|
|
1647 if (!binding)
|
|
1648 return XML_ERROR_NONE;
|
|
1649 localPart = tagNamePtr->str;
|
|
1650 while (*localPart++ != XML_T(':'))
|
|
1651 ;
|
|
1652 }
|
|
1653 else if (dtd.defaultPrefix.binding) {
|
|
1654 binding = dtd.defaultPrefix.binding;
|
|
1655 localPart = tagNamePtr->str;
|
|
1656 }
|
|
1657 else
|
|
1658 return XML_ERROR_NONE;
|
|
1659 tagNamePtr->localPart = localPart;
|
|
1660 tagNamePtr->uriLen = binding->uriLen;
|
|
1661 i = binding->uriLen;
|
|
1662 do {
|
|
1663 if (i == binding->uriAlloc) {
|
|
1664 binding->uri = realloc(binding->uri, binding->uriAlloc *= 2);
|
|
1665 if (!binding->uri)
|
|
1666 return XML_ERROR_NO_MEMORY;
|
|
1667 }
|
|
1668 binding->uri[i++] = *localPart;
|
|
1669 } while (*localPart++);
|
|
1670 tagNamePtr->str = binding->uri;
|
|
1671 return XML_ERROR_NONE;
|
|
1672 }
|
|
1673
|
|
1674 static
|
|
1675 int addBinding(XML_Parser parser, PREFIX *prefix, const ATTRIBUTE_ID *attId, const XML_Char *uri, BINDING **bindingsPtr)
|
|
1676 {
|
|
1677 BINDING *b;
|
|
1678 int len;
|
|
1679 for (len = 0; uri[len]; len++)
|
|
1680 ;
|
|
1681 if (namespaceSeparator)
|
|
1682 len++;
|
|
1683 if (freeBindingList) {
|
|
1684 b = freeBindingList;
|
|
1685 if (len > b->uriAlloc) {
|
|
1686 b->uri = realloc(b->uri, len + EXPAND_SPARE);
|
|
1687 if (!b->uri)
|
|
1688 return 0;
|
|
1689 b->uriAlloc = len + EXPAND_SPARE;
|
|
1690 }
|
|
1691 freeBindingList = b->nextTagBinding;
|
|
1692 }
|
|
1693 else {
|
|
1694 b = malloc(sizeof(BINDING));
|
|
1695 if (!b)
|
|
1696 return 0;
|
|
1697 b->uri = malloc(sizeof(XML_Char) * len + EXPAND_SPARE);
|
|
1698 if (!b->uri) {
|
|
1699 free(b);
|
|
1700 return 0;
|
|
1701 }
|
|
1702 b->uriAlloc = len;
|
|
1703 }
|
|
1704 b->uriLen = len;
|
|
1705 memcpy(b->uri, uri, len * sizeof(XML_Char));
|
|
1706 if (namespaceSeparator)
|
|
1707 b->uri[len - 1] = namespaceSeparator;
|
|
1708 b->prefix = prefix;
|
|
1709 b->attId = attId;
|
|
1710 b->prevPrefixBinding = prefix->binding;
|
|
1711 if (*uri == XML_T('\0') && prefix == &dtd.defaultPrefix)
|
|
1712 prefix->binding = 0;
|
|
1713 else
|
|
1714 prefix->binding = b;
|
|
1715 b->nextTagBinding = *bindingsPtr;
|
|
1716 *bindingsPtr = b;
|
|
1717 if (startNamespaceDeclHandler)
|
|
1718 startNamespaceDeclHandler(handlerArg, prefix->name,
|
|
1719 prefix->binding ? uri : 0);
|
|
1720 return 1;
|
|
1721 }
|
|
1722
|
|
1723 /* The idea here is to avoid using stack for each CDATA section when
|
|
1724 the whole file is parsed with one call. */
|
|
1725
|
|
1726 static
|
|
1727 enum XML_Error cdataSectionProcessor(XML_Parser parser,
|
|
1728 const char *start,
|
|
1729 const char *end,
|
|
1730 const char **endPtr)
|
|
1731 {
|
|
1732 enum XML_Error result = doCdataSection(parser, encoding, &start, end, endPtr);
|
|
1733 if (start) {
|
|
1734 processor = contentProcessor;
|
|
1735 return contentProcessor(parser, start, end, endPtr);
|
|
1736 }
|
|
1737 return result;
|
|
1738 }
|
|
1739
|
|
1740 /* startPtr gets set to non-null is the section is closed, and to null if
|
|
1741 the section is not yet closed. */
|
|
1742
|
|
1743 static
|
|
1744 enum XML_Error doCdataSection(XML_Parser parser,
|
|
1745 const ENCODING *enc,
|
|
1746 const char **startPtr,
|
|
1747 const char *end,
|
|
1748 const char **nextPtr)
|
|
1749 {
|
|
1750 const char *s = *startPtr;
|
|
1751 const char **eventPP;
|
|
1752 const char **eventEndPP;
|
|
1753 if (enc == encoding) {
|
|
1754 eventPP = &eventPtr;
|
|
1755 *eventPP = s;
|
|
1756 eventEndPP = &eventEndPtr;
|
|
1757 }
|
|
1758 else {
|
|
1759 eventPP = &(openInternalEntities->internalEventPtr);
|
|
1760 eventEndPP = &(openInternalEntities->internalEventEndPtr);
|
|
1761 }
|
|
1762 *eventPP = s;
|
|
1763 *startPtr = 0;
|
|
1764 for (;;) {
|
|
1765 const char *next;
|
|
1766 int tok = XmlCdataSectionTok(enc, s, end, &next);
|
|
1767 *eventEndPP = next;
|
|
1768 switch (tok) {
|
|
1769 case XML_TOK_CDATA_SECT_CLOSE:
|
|
1770 if (endCdataSectionHandler)
|
|
1771 endCdataSectionHandler(handlerArg);
|
|
1772 #if 0
|
|
1773 /* see comment under XML_TOK_CDATA_SECT_OPEN */
|
|
1774 else if (characterDataHandler)
|
|
1775 characterDataHandler(handlerArg, dataBuf, 0);
|
|
1776 #endif
|
|
1777 else if (defaultHandler)
|
|
1778 reportDefault(parser, enc, s, next);
|
|
1779 *startPtr = next;
|
|
1780 return XML_ERROR_NONE;
|
|
1781 case XML_TOK_DATA_NEWLINE:
|
|
1782 if (characterDataHandler) {
|
|
1783 XML_Char c = 0xA;
|
|
1784 characterDataHandler(handlerArg, &c, 1);
|
|
1785 }
|
|
1786 else if (defaultHandler)
|
|
1787 reportDefault(parser, enc, s, next);
|
|
1788 break;
|
|
1789 case XML_TOK_DATA_CHARS:
|
|
1790 if (characterDataHandler) {
|
|
1791 if (MUST_CONVERT(enc, s)) {
|
|
1792 for (;;) {
|
|
1793 ICHAR *dataPtr = (ICHAR *)dataBuf;
|
|
1794 XmlConvert(enc, &s, next, &dataPtr, (ICHAR *)dataBufEnd);
|
|
1795 *eventEndPP = next;
|
|
1796 characterDataHandler(handlerArg, dataBuf, dataPtr - (ICHAR *)dataBuf);
|
|
1797 if (s == next)
|
|
1798 break;
|
|
1799 *eventPP = s;
|
|
1800 }
|
|
1801 }
|
|
1802 else
|
|
1803 characterDataHandler(handlerArg,
|
|
1804 (XML_Char *)s,
|
|
1805 (XML_Char *)next - (XML_Char *)s);
|
|
1806 }
|
|
1807 else if (defaultHandler)
|
|
1808 reportDefault(parser, enc, s, next);
|
|
1809 break;
|
|
1810 case XML_TOK_INVALID:
|
|
1811 *eventPP = next;
|
|
1812 return XML_ERROR_INVALID_TOKEN;
|
|
1813 case XML_TOK_PARTIAL_CHAR:
|
|
1814 if (nextPtr) {
|
|
1815 *nextPtr = s;
|
|
1816 return XML_ERROR_NONE;
|
|
1817 }
|
|
1818 return XML_ERROR_PARTIAL_CHAR;
|
|
1819 case XML_TOK_PARTIAL:
|
|
1820 case XML_TOK_NONE:
|
|
1821 if (nextPtr) {
|
|
1822 *nextPtr = s;
|
|
1823 return XML_ERROR_NONE;
|
|
1824 }
|
|
1825 return XML_ERROR_UNCLOSED_CDATA_SECTION;
|
|
1826 default:
|
|
1827 abort();
|
|
1828 }
|
|
1829 *eventPP = s = next;
|
|
1830 }
|
|
1831 /* not reached */
|
|
1832 }
|
|
1833
|
|
1834 static enum XML_Error
|
|
1835 initializeEncoding(XML_Parser parser)
|
|
1836 {
|
|
1837 const char *s;
|
|
1838 #ifdef XML_UNICODE
|
|
1839 char encodingBuf[128];
|
|
1840 if (!protocolEncodingName)
|
|
1841 s = 0;
|
|
1842 else {
|
|
1843 int i;
|
|
1844 for (i = 0; protocolEncodingName[i]; i++) {
|
|
1845 if (i == sizeof(encodingBuf) - 1
|
|
1846 || protocolEncodingName[i] >= 0x80
|
|
1847 || protocolEncodingName[i] < 0) {
|
|
1848 encodingBuf[0] = '\0';
|
|
1849 break;
|
|
1850 }
|
|
1851 encodingBuf[i] = (char)protocolEncodingName[i];
|
|
1852 }
|
|
1853 encodingBuf[i] = '\0';
|
|
1854 s = encodingBuf;
|
|
1855 }
|
|
1856 #else
|
|
1857 s = protocolEncodingName;
|
|
1858 #endif
|
|
1859 if ((ns ? XmlInitEncodingNS : XmlInitEncoding)(&initEncoding, &encoding, s))
|
|
1860 return XML_ERROR_NONE;
|
|
1861 return handleUnknownEncoding(parser, protocolEncodingName);
|
|
1862 }
|
|
1863
|
|
1864 static enum XML_Error
|
|
1865 processXmlDecl(XML_Parser parser, int isGeneralTextEntity,
|
|
1866 const char *s, const char *next)
|
|
1867 {
|
|
1868 const char *encodingName = 0;
|
|
1869 const ENCODING *newEncoding = 0;
|
|
1870 const char *version;
|
|
1871 int standalone = -1;
|
|
1872 if (!(ns
|
|
1873 ? XmlParseXmlDeclNS
|
|
1874 : XmlParseXmlDecl)(isGeneralTextEntity,
|
|
1875 encoding,
|
|
1876 s,
|
|
1877 next,
|
|
1878 &eventPtr,
|
|
1879 &version,
|
|
1880 &encodingName,
|
|
1881 &newEncoding,
|
|
1882 &standalone))
|
|
1883 return XML_ERROR_SYNTAX;
|
|
1884 if (!isGeneralTextEntity && standalone == 1)
|
|
1885 dtd.standalone = 1;
|
|
1886 if (defaultHandler)
|
|
1887 reportDefault(parser, encoding, s, next);
|
|
1888 if (!protocolEncodingName) {
|
|
1889 if (newEncoding) {
|
|
1890 if (newEncoding->minBytesPerChar != encoding->minBytesPerChar) {
|
|
1891 eventPtr = encodingName;
|
|
1892 return XML_ERROR_INCORRECT_ENCODING;
|
|
1893 }
|
|
1894 encoding = newEncoding;
|
|
1895 }
|
|
1896 else if (encodingName) {
|
|
1897 enum XML_Error result;
|
|
1898 const XML_Char *s = poolStoreString(&tempPool,
|
|
1899 encoding,
|
|
1900 encodingName,
|
|
1901 encodingName
|
|
1902 + XmlNameLength(encoding, encodingName));
|
|
1903 if (!s)
|
|
1904 return XML_ERROR_NO_MEMORY;
|
|
1905 result = handleUnknownEncoding(parser, s);
|
|
1906 poolDiscard(&tempPool);
|
|
1907 if (result == XML_ERROR_UNKNOWN_ENCODING)
|
|
1908 eventPtr = encodingName;
|
|
1909 return result;
|
|
1910 }
|
|
1911 }
|
|
1912 return XML_ERROR_NONE;
|
|
1913 }
|
|
1914
|
|
1915 static enum XML_Error
|
|
1916 handleUnknownEncoding(XML_Parser parser, const XML_Char *encodingName)
|
|
1917 {
|
|
1918 if (unknownEncodingHandler) {
|
|
1919 XML_Encoding info;
|
|
1920 int i;
|
|
1921 for (i = 0; i < 256; i++)
|
|
1922 info.map[i] = -1;
|
|
1923 info.convert = 0;
|
|
1924 info.data = 0;
|
|
1925 info.release = 0;
|
|
1926 if (unknownEncodingHandler(unknownEncodingHandlerData, encodingName, &info)) {
|
|
1927 ENCODING *enc;
|
|
1928 unknownEncodingMem = malloc(XmlSizeOfUnknownEncoding());
|
|
1929 if (!unknownEncodingMem) {
|
|
1930 if (info.release)
|
|
1931 info.release(info.data);
|
|
1932 return XML_ERROR_NO_MEMORY;
|
|
1933 }
|
|
1934 enc = (ns
|
|
1935 ? XmlInitUnknownEncodingNS
|
|
1936 : XmlInitUnknownEncoding)(unknownEncodingMem,
|
|
1937 info.map,
|
|
1938 info.convert,
|
|
1939 info.data);
|
|
1940 if (enc) {
|
|
1941 unknownEncodingData = info.data;
|
|
1942 unknownEncodingRelease = info.release;
|
|
1943 encoding = enc;
|
|
1944 return XML_ERROR_NONE;
|
|
1945 }
|
|
1946 }
|
|
1947 if (info.release)
|
|
1948 info.release(info.data);
|
|
1949 }
|
|
1950 return XML_ERROR_UNKNOWN_ENCODING;
|
|
1951 }
|
|
1952
|
|
1953 static enum XML_Error
|
|
1954 prologInitProcessor(XML_Parser parser,
|
|
1955 const char *s,
|
|
1956 const char *end,
|
|
1957 const char **nextPtr)
|
|
1958 {
|
|
1959 enum XML_Error result = initializeEncoding(parser);
|
|
1960 if (result != XML_ERROR_NONE)
|
|
1961 return result;
|
|
1962 processor = prologProcessor;
|
|
1963 return prologProcessor(parser, s, end, nextPtr);
|
|
1964 }
|
|
1965
|
|
1966 static enum XML_Error
|
|
1967 prologProcessor(XML_Parser parser,
|
|
1968 const char *s,
|
|
1969 const char *end,
|
|
1970 const char **nextPtr)
|
|
1971 {
|
|
1972 for (;;) {
|
|
1973 const char *next;
|
|
1974 int tok = XmlPrologTok(encoding, s, end, &next);
|
|
1975 if (tok <= 0) {
|
|
1976 if (nextPtr != 0 && tok != XML_TOK_INVALID) {
|
|
1977 *nextPtr = s;
|
|
1978 return XML_ERROR_NONE;
|
|
1979 }
|
|
1980 switch (tok) {
|
|
1981 case XML_TOK_INVALID:
|
|
1982 eventPtr = next;
|
|
1983 return XML_ERROR_INVALID_TOKEN;
|
|
1984 case XML_TOK_NONE:
|
|
1985 return XML_ERROR_NO_ELEMENTS;
|
|
1986 case XML_TOK_PARTIAL:
|
|
1987 return XML_ERROR_UNCLOSED_TOKEN;
|
|
1988 case XML_TOK_PARTIAL_CHAR:
|
|
1989 return XML_ERROR_PARTIAL_CHAR;
|
|
1990 case XML_TOK_TRAILING_CR:
|
|
1991 eventPtr = s + encoding->minBytesPerChar;
|
|
1992 return XML_ERROR_NO_ELEMENTS;
|
|
1993 default:
|
|
1994 abort();
|
|
1995 }
|
|
1996 }
|
|
1997 switch (XmlTokenRole(&prologState, tok, s, next, encoding)) {
|
|
1998 case XML_ROLE_XML_DECL:
|
|
1999 {
|
|
2000 enum XML_Error result = processXmlDecl(parser, 0, s, next);
|
|
2001 if (result != XML_ERROR_NONE)
|
|
2002 return result;
|
|
2003 }
|
|
2004 break;
|
|
2005 case XML_ROLE_DOCTYPE_SYSTEM_ID:
|
|
2006 if (!dtd.standalone
|
|
2007 && notStandaloneHandler
|
|
2008 && !notStandaloneHandler(handlerArg))
|
|
2009 return XML_ERROR_NOT_STANDALONE;
|
|
2010 hadExternalDoctype = 1;
|
|
2011 break;
|
|
2012 case XML_ROLE_DOCTYPE_PUBLIC_ID:
|
|
2013 case XML_ROLE_ENTITY_PUBLIC_ID:
|
|
2014 if (!XmlIsPublicId(encoding, s, next, &eventPtr))
|
|
2015 return XML_ERROR_SYNTAX;
|
|
2016 if (declEntity) {
|
|
2017 XML_Char *tem = poolStoreString(&dtd.pool,
|
|
2018 encoding,
|
|
2019 s + encoding->minBytesPerChar,
|
|
2020 next - encoding->minBytesPerChar);
|
|
2021 if (!tem)
|
|
2022 return XML_ERROR_NO_MEMORY;
|
|
2023 normalizePublicId(tem);
|
|
2024 declEntity->publicId = tem;
|
|
2025 poolFinish(&dtd.pool);
|
|
2026 }
|
|
2027 break;
|
|
2028 case XML_ROLE_INSTANCE_START:
|
|
2029 processor = contentProcessor;
|
|
2030 if (hadExternalDoctype)
|
|
2031 dtd.complete = 0;
|
|
2032 return contentProcessor(parser, s, end, nextPtr);
|
|
2033 case XML_ROLE_ATTLIST_ELEMENT_NAME:
|
|
2034 {
|
|
2035 const XML_Char *name = poolStoreString(&dtd.pool, encoding, s, next);
|
|
2036 if (!name)
|
|
2037 return XML_ERROR_NO_MEMORY;
|
|
2038 declElementType = (ELEMENT_TYPE *)lookup(&dtd.elementTypes, name, sizeof(ELEMENT_TYPE));
|
|
2039 if (!declElementType)
|
|
2040 return XML_ERROR_NO_MEMORY;
|
|
2041 if (declElementType->name != name)
|
|
2042 poolDiscard(&dtd.pool);
|
|
2043 else {
|
|
2044 poolFinish(&dtd.pool);
|
|
2045 if (!setElementTypePrefix(parser, declElementType))
|
|
2046 return XML_ERROR_NO_MEMORY;
|
|
2047 }
|
|
2048 break;
|
|
2049 }
|
|
2050 case XML_ROLE_ATTRIBUTE_NAME:
|
|
2051 declAttributeId = getAttributeId(parser, encoding, s, next);
|
|
2052 if (!declAttributeId)
|
|
2053 return XML_ERROR_NO_MEMORY;
|
|
2054 declAttributeIsCdata = 0;
|
|
2055 break;
|
|
2056 case XML_ROLE_ATTRIBUTE_TYPE_CDATA:
|
|
2057 declAttributeIsCdata = 1;
|
|
2058 break;
|
|
2059 case XML_ROLE_IMPLIED_ATTRIBUTE_VALUE:
|
|
2060 case XML_ROLE_REQUIRED_ATTRIBUTE_VALUE:
|
|
2061 if (dtd.complete
|
|
2062 && !defineAttribute(declElementType, declAttributeId, declAttributeIsCdata, 0))
|
|
2063 return XML_ERROR_NO_MEMORY;
|
|
2064 break;
|
|
2065 case XML_ROLE_DEFAULT_ATTRIBUTE_VALUE:
|
|
2066 case XML_ROLE_FIXED_ATTRIBUTE_VALUE:
|
|
2067 {
|
|
2068 const XML_Char *attVal;
|
|
2069 enum XML_Error result
|
|
2070 = storeAttributeValue(parser, encoding, declAttributeIsCdata,
|
|
2071 s + encoding->minBytesPerChar,
|
|
2072 next - encoding->minBytesPerChar,
|
|
2073 &dtd.pool);
|
|
2074 if (result)
|
|
2075 return result;
|
|
2076 attVal = poolStart(&dtd.pool);
|
|
2077 poolFinish(&dtd.pool);
|
|
2078 if (dtd.complete
|
|
2079 && !defineAttribute(declElementType, declAttributeId, declAttributeIsCdata, attVal))
|
|
2080 return XML_ERROR_NO_MEMORY;
|
|
2081 break;
|
|
2082 }
|
|
2083 case XML_ROLE_ENTITY_VALUE:
|
|
2084 {
|
|
2085 enum XML_Error result = storeEntityValue(parser, s, next);
|
|
2086 if (result != XML_ERROR_NONE)
|
|
2087 return result;
|
|
2088 }
|
|
2089 break;
|
|
2090 case XML_ROLE_ENTITY_SYSTEM_ID:
|
|
2091 if (declEntity) {
|
|
2092 declEntity->systemId = poolStoreString(&dtd.pool, encoding,
|
|
2093 s + encoding->minBytesPerChar,
|
|
2094 next - encoding->minBytesPerChar);
|
|
2095 if (!declEntity->systemId)
|
|
2096 return XML_ERROR_NO_MEMORY;
|
|
2097 declEntity->base = dtd.base;
|
|
2098 poolFinish(&dtd.pool);
|
|
2099 }
|
|
2100 break;
|
|
2101 case XML_ROLE_ENTITY_NOTATION_NAME:
|
|
2102 if (declEntity) {
|
|
2103 declEntity->notation = poolStoreString(&dtd.pool, encoding, s, next);
|
|
2104 if (!declEntity->notation)
|
|
2105 return XML_ERROR_NO_MEMORY;
|
|
2106 poolFinish(&dtd.pool);
|
|
2107 if (unparsedEntityDeclHandler) {
|
|
2108 eventPtr = eventEndPtr = s;
|
|
2109 unparsedEntityDeclHandler(handlerArg,
|
|
2110 declEntity->name,
|
|
2111 declEntity->base,
|
|
2112 declEntity->systemId,
|
|
2113 declEntity->publicId,
|
|
2114 declEntity->notation);
|
|
2115 }
|
|
2116
|
|
2117 }
|
|
2118 break;
|
|
2119 case XML_ROLE_GENERAL_ENTITY_NAME:
|
|
2120 {
|
|
2121 const XML_Char *name;
|
|
2122 if (XmlPredefinedEntityName(encoding, s, next)) {
|
|
2123 declEntity = 0;
|
|
2124 break;
|
|
2125 }
|
|
2126 name = poolStoreString(&dtd.pool, encoding, s, next);
|
|
2127 if (!name)
|
|
2128 return XML_ERROR_NO_MEMORY;
|
|
2129 if (dtd.complete) {
|
|
2130 declEntity = (ENTITY *)lookup(&dtd.generalEntities, name, sizeof(ENTITY));
|
|
2131 if (!declEntity)
|
|
2132 return XML_ERROR_NO_MEMORY;
|
|
2133 if (declEntity->name != name) {
|
|
2134 poolDiscard(&dtd.pool);
|
|
2135 declEntity = 0;
|
|
2136 }
|
|
2137 else
|
|
2138 poolFinish(&dtd.pool);
|
|
2139 }
|
|
2140 else {
|
|
2141 poolDiscard(&dtd.pool);
|
|
2142 declEntity = 0;
|
|
2143 }
|
|
2144 }
|
|
2145 break;
|
|
2146 case XML_ROLE_PARAM_ENTITY_NAME:
|
|
2147 declEntity = 0;
|
|
2148 break;
|
|
2149 case XML_ROLE_NOTATION_NAME:
|
|
2150 declNotationPublicId = 0;
|
|
2151 declNotationName = 0;
|
|
2152 if (notationDeclHandler) {
|
|
2153 declNotationName = poolStoreString(&tempPool, encoding, s, next);
|
|
2154 if (!declNotationName)
|
|
2155 return XML_ERROR_NO_MEMORY;
|
|
2156 poolFinish(&tempPool);
|
|
2157 }
|
|
2158 break;
|
|
2159 case XML_ROLE_NOTATION_PUBLIC_ID:
|
|
2160 if (!XmlIsPublicId(encoding, s, next, &eventPtr))
|
|
2161 return XML_ERROR_SYNTAX;
|
|
2162 if (declNotationName) {
|
|
2163 XML_Char *tem = poolStoreString(&tempPool,
|
|
2164 encoding,
|
|
2165 s + encoding->minBytesPerChar,
|
|
2166 next - encoding->minBytesPerChar);
|
|
2167 if (!tem)
|
|
2168 return XML_ERROR_NO_MEMORY;
|
|
2169 normalizePublicId(tem);
|
|
2170 declNotationPublicId = tem;
|
|
2171 poolFinish(&tempPool);
|
|
2172 }
|
|
2173 break;
|
|
2174 case XML_ROLE_NOTATION_SYSTEM_ID:
|
|
2175 if (declNotationName && notationDeclHandler) {
|
|
2176 const XML_Char *systemId
|
|
2177 = poolStoreString(&tempPool, encoding,
|
|
2178 s + encoding->minBytesPerChar,
|
|
2179 next - encoding->minBytesPerChar);
|
|
2180 if (!systemId)
|
|
2181 return XML_ERROR_NO_MEMORY;
|
|
2182 eventPtr = eventEndPtr = s;
|
|
2183 notationDeclHandler(handlerArg,
|
|
2184 declNotationName,
|
|
2185 dtd.base,
|
|
2186 systemId,
|
|
2187 declNotationPublicId);
|
|
2188 }
|
|
2189 poolClear(&tempPool);
|
|
2190 break;
|
|
2191 case XML_ROLE_NOTATION_NO_SYSTEM_ID:
|
|
2192 if (declNotationPublicId && notationDeclHandler) {
|
|
2193 eventPtr = eventEndPtr = s;
|
|
2194 notationDeclHandler(handlerArg,
|
|
2195 declNotationName,
|
|
2196 dtd.base,
|
|
2197 0,
|
|
2198 declNotationPublicId);
|
|
2199 }
|
|
2200 poolClear(&tempPool);
|
|
2201 break;
|
|
2202 case XML_ROLE_ERROR:
|
|
2203 eventPtr = s;
|
|
2204 switch (tok) {
|
|
2205 case XML_TOK_PARAM_ENTITY_REF:
|
|
2206 return XML_ERROR_PARAM_ENTITY_REF;
|
|
2207 case XML_TOK_XML_DECL:
|
|
2208 return XML_ERROR_MISPLACED_XML_PI;
|
|
2209 default:
|
|
2210 return XML_ERROR_SYNTAX;
|
|
2211 }
|
|
2212 case XML_ROLE_GROUP_OPEN:
|
|
2213 if (prologState.level >= groupSize) {
|
|
2214 if (groupSize)
|
|
2215 groupConnector = realloc(groupConnector, groupSize *= 2);
|
|
2216 else
|
|
2217 groupConnector = malloc(groupSize = 32);
|
|
2218 if (!groupConnector)
|
|
2219 return XML_ERROR_NO_MEMORY;
|
|
2220 }
|
|
2221 groupConnector[prologState.level] = 0;
|
|
2222 break;
|
|
2223 case XML_ROLE_GROUP_SEQUENCE:
|
|
2224 if (groupConnector[prologState.level] == '|') {
|
|
2225 eventPtr = s;
|
|
2226 return XML_ERROR_SYNTAX;
|
|
2227 }
|
|
2228 groupConnector[prologState.level] = ',';
|
|
2229 break;
|
|
2230 case XML_ROLE_GROUP_CHOICE:
|
|
2231 if (groupConnector[prologState.level] == ',') {
|
|
2232 eventPtr = s;
|
|
2233 return XML_ERROR_SYNTAX;
|
|
2234 }
|
|
2235 groupConnector[prologState.level] = '|';
|
|
2236 break;
|
|
2237 case XML_ROLE_PARAM_ENTITY_REF:
|
|
2238 if (!dtd.standalone
|
|
2239 && notStandaloneHandler
|
|
2240 && !notStandaloneHandler(handlerArg))
|
|
2241 return XML_ERROR_NOT_STANDALONE;
|
|
2242 dtd.complete = 0;
|
|
2243 break;
|
|
2244 case XML_ROLE_NONE:
|
|
2245 switch (tok) {
|
|
2246 case XML_TOK_PI:
|
|
2247 eventPtr = s;
|
|
2248 eventEndPtr = next;
|
|
2249 if (!reportProcessingInstruction(parser, encoding, s, next))
|
|
2250 return XML_ERROR_NO_MEMORY;
|
|
2251 break;
|
|
2252 case XML_TOK_COMMENT:
|
|
2253 eventPtr = s;
|
|
2254 eventEndPtr = next;
|
|
2255 if (!reportComment(parser, encoding, s, next))
|
|
2256 return XML_ERROR_NO_MEMORY;
|
|
2257 break;
|
|
2258 }
|
|
2259 break;
|
|
2260 }
|
|
2261 if (defaultHandler) {
|
|
2262 switch (tok) {
|
|
2263 case XML_TOK_PI:
|
|
2264 case XML_TOK_COMMENT:
|
|
2265 case XML_TOK_BOM:
|
|
2266 case XML_TOK_XML_DECL:
|
|
2267 break;
|
|
2268 default:
|
|
2269 eventPtr = s;
|
|
2270 eventEndPtr = next;
|
|
2271 reportDefault(parser, encoding, s, next);
|
|
2272 }
|
|
2273 }
|
|
2274 s = next;
|
|
2275 }
|
|
2276 /* not reached */
|
|
2277 }
|
|
2278
|
|
2279 static
|
|
2280 enum XML_Error epilogProcessor(XML_Parser parser,
|
|
2281 const char *s,
|
|
2282 const char *end,
|
|
2283 const char **nextPtr)
|
|
2284 {
|
|
2285 processor = epilogProcessor;
|
|
2286 eventPtr = s;
|
|
2287 for (;;) {
|
|
2288 const char *next;
|
|
2289 int tok = XmlPrologTok(encoding, s, end, &next);
|
|
2290 eventEndPtr = next;
|
|
2291 switch (tok) {
|
|
2292 case XML_TOK_TRAILING_CR:
|
|
2293 if (defaultHandler) {
|
|
2294 eventEndPtr = end;
|
|
2295 reportDefault(parser, encoding, s, end);
|
|
2296 }
|
|
2297 /* fall through */
|
|
2298 case XML_TOK_NONE:
|
|
2299 if (nextPtr)
|
|
2300 *nextPtr = end;
|
|
2301 return XML_ERROR_NONE;
|
|
2302 case XML_TOK_PROLOG_S:
|
|
2303 if (defaultHandler)
|
|
2304 reportDefault(parser, encoding, s, next);
|
|
2305 break;
|
|
2306 case XML_TOK_PI:
|
|
2307 if (!reportProcessingInstruction(parser, encoding, s, next))
|
|
2308 return XML_ERROR_NO_MEMORY;
|
|
2309 break;
|
|
2310 case XML_TOK_COMMENT:
|
|
2311 if (!reportComment(parser, encoding, s, next))
|
|
2312 return XML_ERROR_NO_MEMORY;
|
|
2313 break;
|
|
2314 case XML_TOK_INVALID:
|
|
2315 eventPtr = next;
|
|
2316 return XML_ERROR_INVALID_TOKEN;
|
|
2317 case XML_TOK_PARTIAL:
|
|
2318 if (nextPtr) {
|
|
2319 *nextPtr = s;
|
|
2320 return XML_ERROR_NONE;
|
|
2321 }
|
|
2322 return XML_ERROR_UNCLOSED_TOKEN;
|
|
2323 case XML_TOK_PARTIAL_CHAR:
|
|
2324 if (nextPtr) {
|
|
2325 *nextPtr = s;
|
|
2326 return XML_ERROR_NONE;
|
|
2327 }
|
|
2328 return XML_ERROR_PARTIAL_CHAR;
|
|
2329 default:
|
|
2330 return XML_ERROR_JUNK_AFTER_DOC_ELEMENT;
|
|
2331 }
|
|
2332 eventPtr = s = next;
|
|
2333 }
|
|
2334 }
|
|
2335
|
|
2336 static
|
|
2337 enum XML_Error errorProcessor(XML_Parser parser,
|
|
2338 const char *s,
|
|
2339 const char *end,
|
|
2340 const char **nextPtr)
|
|
2341 {
|
|
2342 return errorCode;
|
|
2343 }
|
|
2344
|
|
2345 static enum XML_Error
|
|
2346 storeAttributeValue(XML_Parser parser, const ENCODING *enc, int isCdata,
|
|
2347 const char *ptr, const char *end,
|
|
2348 STRING_POOL *pool)
|
|
2349 {
|
|
2350 enum XML_Error result = appendAttributeValue(parser, enc, isCdata, ptr, end, pool);
|
|
2351 if (result)
|
|
2352 return result;
|
|
2353 if (!isCdata && poolLength(pool) && poolLastChar(pool) == 0x20)
|
|
2354 poolChop(pool);
|
|
2355 if (!poolAppendChar(pool, XML_T('\0')))
|
|
2356 return XML_ERROR_NO_MEMORY;
|
|
2357 return XML_ERROR_NONE;
|
|
2358 }
|
|
2359
|
|
2360 static enum XML_Error
|
|
2361 appendAttributeValue(XML_Parser parser, const ENCODING *enc, int isCdata,
|
|
2362 const char *ptr, const char *end,
|
|
2363 STRING_POOL *pool)
|
|
2364 {
|
|
2365 const ENCODING *internalEnc = ns ? XmlGetInternalEncodingNS() : XmlGetInternalEncoding();
|
|
2366 for (;;) {
|
|
2367 const char *next;
|
|
2368 int tok = XmlAttributeValueTok(enc, ptr, end, &next);
|
|
2369 switch (tok) {
|
|
2370 case XML_TOK_NONE:
|
|
2371 return XML_ERROR_NONE;
|
|
2372 case XML_TOK_INVALID:
|
|
2373 if (enc == encoding)
|
|
2374 eventPtr = next;
|
|
2375 return XML_ERROR_INVALID_TOKEN;
|
|
2376 case XML_TOK_PARTIAL:
|
|
2377 if (enc == encoding)
|
|
2378 eventPtr = ptr;
|
|
2379 return XML_ERROR_INVALID_TOKEN;
|
|
2380 case XML_TOK_CHAR_REF:
|
|
2381 {
|
|
2382 XML_Char buf[XML_ENCODE_MAX];
|
|
2383 int i;
|
|
2384 int n = XmlCharRefNumber(enc, ptr);
|
|
2385 if (n < 0) {
|
|
2386 if (enc == encoding)
|
|
2387 eventPtr = ptr;
|
|
2388 return XML_ERROR_BAD_CHAR_REF;
|
|
2389 }
|
|
2390 if (!isCdata
|
|
2391 && n == 0x20 /* space */
|
|
2392 && (poolLength(pool) == 0 || poolLastChar(pool) == 0x20))
|
|
2393 break;
|
|
2394 n = XmlEncode(n, (ICHAR *)buf);
|
|
2395 if (!n) {
|
|
2396 if (enc == encoding)
|
|
2397 eventPtr = ptr;
|
|
2398 return XML_ERROR_BAD_CHAR_REF;
|
|
2399 }
|
|
2400 for (i = 0; i < n; i++) {
|
|
2401 if (!poolAppendChar(pool, buf[i]))
|
|
2402 return XML_ERROR_NO_MEMORY;
|
|
2403 }
|
|
2404 }
|
|
2405 break;
|
|
2406 case XML_TOK_DATA_CHARS:
|
|
2407 if (!poolAppend(pool, enc, ptr, next))
|
|
2408 return XML_ERROR_NO_MEMORY;
|
|
2409 break;
|
|
2410 break;
|
|
2411 case XML_TOK_TRAILING_CR:
|
|
2412 next = ptr + enc->minBytesPerChar;
|
|
2413 /* fall through */
|
|
2414 case XML_TOK_ATTRIBUTE_VALUE_S:
|
|
2415 case XML_TOK_DATA_NEWLINE:
|
|
2416 if (!isCdata && (poolLength(pool) == 0 || poolLastChar(pool) == 0x20))
|
|
2417 break;
|
|
2418 if (!poolAppendChar(pool, 0x20))
|
|
2419 return XML_ERROR_NO_MEMORY;
|
|
2420 break;
|
|
2421 case XML_TOK_ENTITY_REF:
|
|
2422 {
|
|
2423 const XML_Char *name;
|
|
2424 ENTITY *entity;
|
|
2425 XML_Char ch = XmlPredefinedEntityName(enc,
|
|
2426 ptr + enc->minBytesPerChar,
|
|
2427 next - enc->minBytesPerChar);
|
|
2428 if (ch) {
|
|
2429 if (!poolAppendChar(pool, ch))
|
|
2430 return XML_ERROR_NO_MEMORY;
|
|
2431 break;
|
|
2432 }
|
|
2433 name = poolStoreString(&temp2Pool, enc,
|
|
2434 ptr + enc->minBytesPerChar,
|
|
2435 next - enc->minBytesPerChar);
|
|
2436 if (!name)
|
|
2437 return XML_ERROR_NO_MEMORY;
|
|
2438 entity = (ENTITY *)lookup(&dtd.generalEntities, name, 0);
|
|
2439 poolDiscard(&temp2Pool);
|
|
2440 if (!entity) {
|
|
2441 if (dtd.complete) {
|
|
2442 if (enc == encoding)
|
|
2443 eventPtr = ptr;
|
|
2444 return XML_ERROR_UNDEFINED_ENTITY;
|
|
2445 }
|
|
2446 }
|
|
2447 else if (entity->open) {
|
|
2448 if (enc == encoding)
|
|
2449 eventPtr = ptr;
|
|
2450 return XML_ERROR_RECURSIVE_ENTITY_REF;
|
|
2451 }
|
|
2452 else if (entity->notation) {
|
|
2453 if (enc == encoding)
|
|
2454 eventPtr = ptr;
|
|
2455 return XML_ERROR_BINARY_ENTITY_REF;
|
|
2456 }
|
|
2457 else if (!entity->textPtr) {
|
|
2458 if (enc == encoding)
|
|
2459 eventPtr = ptr;
|
|
2460 return XML_ERROR_ATTRIBUTE_EXTERNAL_ENTITY_REF;
|
|
2461 }
|
|
2462 else {
|
|
2463 enum XML_Error result;
|
|
2464 const XML_Char *textEnd = entity->textPtr + entity->textLen;
|
|
2465 entity->open = 1;
|
|
2466 result = appendAttributeValue(parser, internalEnc, isCdata, (char *)entity->textPtr, (char *)textEnd, pool);
|
|
2467 entity->open = 0;
|
|
2468 if (result)
|
|
2469 return result;
|
|
2470 }
|
|
2471 }
|
|
2472 break;
|
|
2473 default:
|
|
2474 abort();
|
|
2475 }
|
|
2476 ptr = next;
|
|
2477 }
|
|
2478 /* not reached */
|
|
2479 }
|
|
2480
|
|
2481 static
|
|
2482 enum XML_Error storeEntityValue(XML_Parser parser,
|
|
2483 const char *entityTextPtr,
|
|
2484 const char *entityTextEnd)
|
|
2485 {
|
|
2486 const ENCODING *internalEnc = ns ? XmlGetInternalEncodingNS() : XmlGetInternalEncoding();
|
|
2487 STRING_POOL *pool = &(dtd.pool);
|
|
2488 entityTextPtr += encoding->minBytesPerChar;
|
|
2489 entityTextEnd -= encoding->minBytesPerChar;
|
|
2490 for (;;) {
|
|
2491 const char *next;
|
|
2492 int tok = XmlEntityValueTok(encoding, entityTextPtr, entityTextEnd, &next);
|
|
2493 switch (tok) {
|
|
2494 case XML_TOK_PARAM_ENTITY_REF:
|
|
2495 eventPtr = entityTextPtr;
|
|
2496 return XML_ERROR_SYNTAX;
|
|
2497 case XML_TOK_NONE:
|
|
2498 if (declEntity) {
|
|
2499 declEntity->textPtr = pool->start;
|
|
2500 declEntity->textLen = pool->ptr - pool->start;
|
|
2501 poolFinish(pool);
|
|
2502 }
|
|
2503 else
|
|
2504 poolDiscard(pool);
|
|
2505 return XML_ERROR_NONE;
|
|
2506 case XML_TOK_ENTITY_REF:
|
|
2507 case XML_TOK_DATA_CHARS:
|
|
2508 if (!poolAppend(pool, encoding, entityTextPtr, next))
|
|
2509 return XML_ERROR_NO_MEMORY;
|
|
2510 break;
|
|
2511 case XML_TOK_TRAILING_CR:
|
|
2512 next = entityTextPtr + encoding->minBytesPerChar;
|
|
2513 /* fall through */
|
|
2514 case XML_TOK_DATA_NEWLINE:
|
|
2515 if (pool->end == pool->ptr && !poolGrow(pool))
|
|
2516 return XML_ERROR_NO_MEMORY;
|
|
2517 *(pool->ptr)++ = 0xA;
|
|
2518 break;
|
|
2519 case XML_TOK_CHAR_REF:
|
|
2520 {
|
|
2521 XML_Char buf[XML_ENCODE_MAX];
|
|
2522 int i;
|
|
2523 int n = XmlCharRefNumber(encoding, entityTextPtr);
|
|
2524 if (n < 0) {
|
|
2525 eventPtr = entityTextPtr;
|
|
2526 return XML_ERROR_BAD_CHAR_REF;
|
|
2527 }
|
|
2528 n = XmlEncode(n, (ICHAR *)buf);
|
|
2529 if (!n) {
|
|
2530 eventPtr = entityTextPtr;
|
|
2531 return XML_ERROR_BAD_CHAR_REF;
|
|
2532 }
|
|
2533 for (i = 0; i < n; i++) {
|
|
2534 if (pool->end == pool->ptr && !poolGrow(pool))
|
|
2535 return XML_ERROR_NO_MEMORY;
|
|
2536 *(pool->ptr)++ = buf[i];
|
|
2537 }
|
|
2538 }
|
|
2539 break;
|
|
2540 case XML_TOK_PARTIAL:
|
|
2541 eventPtr = entityTextPtr;
|
|
2542 return XML_ERROR_INVALID_TOKEN;
|
|
2543 case XML_TOK_INVALID:
|
|
2544 eventPtr = next;
|
|
2545 return XML_ERROR_INVALID_TOKEN;
|
|
2546 default:
|
|
2547 abort();
|
|
2548 }
|
|
2549 entityTextPtr = next;
|
|
2550 }
|
|
2551 /* not reached */
|
|
2552 }
|
|
2553
|
|
2554 static void
|
|
2555 normalizeLines(XML_Char *s)
|
|
2556 {
|
|
2557 XML_Char *p;
|
|
2558 for (;; s++) {
|
|
2559 if (*s == XML_T('\0'))
|
|
2560 return;
|
|
2561 if (*s == 0xD)
|
|
2562 break;
|
|
2563 }
|
|
2564 p = s;
|
|
2565 do {
|
|
2566 if (*s == 0xD) {
|
|
2567 *p++ = 0xA;
|
|
2568 if (*++s == 0xA)
|
|
2569 s++;
|
|
2570 }
|
|
2571 else
|
|
2572 *p++ = *s++;
|
|
2573 } while (*s);
|
|
2574 *p = XML_T('\0');
|
|
2575 }
|
|
2576
|
|
2577 static int
|
|
2578 reportProcessingInstruction(XML_Parser parser, const ENCODING *enc, const char *start, const char *end)
|
|
2579 {
|
|
2580 const XML_Char *target;
|
|
2581 XML_Char *data;
|
|
2582 const char *tem;
|
|
2583 if (!processingInstructionHandler) {
|
|
2584 if (defaultHandler)
|
|
2585 reportDefault(parser, enc, start, end);
|
|
2586 return 1;
|
|
2587 }
|
|
2588 start += enc->minBytesPerChar * 2;
|
|
2589 tem = start + XmlNameLength(enc, start);
|
|
2590 target = poolStoreString(&tempPool, enc, start, tem);
|
|
2591 if (!target)
|
|
2592 return 0;
|
|
2593 poolFinish(&tempPool);
|
|
2594 data = poolStoreString(&tempPool, enc,
|
|
2595 XmlSkipS(enc, tem),
|
|
2596 end - enc->minBytesPerChar*2);
|
|
2597 if (!data)
|
|
2598 return 0;
|
|
2599 normalizeLines(data);
|
|
2600 processingInstructionHandler(handlerArg, target, data);
|
|
2601 poolClear(&tempPool);
|
|
2602 return 1;
|
|
2603 }
|
|
2604
|
|
2605 static int
|
|
2606 reportComment(XML_Parser parser, const ENCODING *enc, const char *start, const char *end)
|
|
2607 {
|
|
2608 XML_Char *data;
|
|
2609 if (!commentHandler) {
|
|
2610 if (defaultHandler)
|
|
2611 reportDefault(parser, enc, start, end);
|
|
2612 return 1;
|
|
2613 }
|
|
2614 data = poolStoreString(&tempPool,
|
|
2615 enc,
|
|
2616 start + enc->minBytesPerChar * 4,
|
|
2617 end - enc->minBytesPerChar * 3);
|
|
2618 if (!data)
|
|
2619 return 0;
|
|
2620 normalizeLines(data);
|
|
2621 commentHandler(handlerArg, data);
|
|
2622 poolClear(&tempPool);
|
|
2623 return 1;
|
|
2624 }
|
|
2625
|
|
2626 static void
|
|
2627 reportDefault(XML_Parser parser, const ENCODING *enc, const char *s, const char *end)
|
|
2628 {
|
|
2629 if (MUST_CONVERT(enc, s)) {
|
|
2630 const char **eventPP;
|
|
2631 const char **eventEndPP;
|
|
2632 if (enc == encoding) {
|
|
2633 eventPP = &eventPtr;
|
|
2634 eventEndPP = &eventEndPtr;
|
|
2635 }
|
|
2636 else {
|
|
2637 eventPP = &(openInternalEntities->internalEventPtr);
|
|
2638 eventEndPP = &(openInternalEntities->internalEventEndPtr);
|
|
2639 }
|
|
2640 do {
|
|
2641 ICHAR *dataPtr = (ICHAR *)dataBuf;
|
|
2642 XmlConvert(enc, &s, end, &dataPtr, (ICHAR *)dataBufEnd);
|
|
2643 *eventEndPP = s;
|
|
2644 defaultHandler(handlerArg, dataBuf, dataPtr - (ICHAR *)dataBuf);
|
|
2645 *eventPP = s;
|
|
2646 } while (s != end);
|
|
2647 }
|
|
2648 else
|
|
2649 defaultHandler(handlerArg, (XML_Char *)s, (XML_Char *)end - (XML_Char *)s);
|
|
2650 }
|
|
2651
|
|
2652
|
|
2653 static int
|
|
2654 defineAttribute(ELEMENT_TYPE *type, ATTRIBUTE_ID *attId, int isCdata, const XML_Char *value)
|
|
2655 {
|
|
2656 DEFAULT_ATTRIBUTE *att;
|
|
2657 if (type->nDefaultAtts == type->allocDefaultAtts) {
|
|
2658 if (type->allocDefaultAtts == 0) {
|
|
2659 type->allocDefaultAtts = 8;
|
|
2660 type->defaultAtts = malloc(type->allocDefaultAtts*sizeof(DEFAULT_ATTRIBUTE));
|
|
2661 }
|
|
2662 else {
|
|
2663 type->allocDefaultAtts *= 2;
|
|
2664 type->defaultAtts = realloc(type->defaultAtts,
|
|
2665 type->allocDefaultAtts*sizeof(DEFAULT_ATTRIBUTE));
|
|
2666 }
|
|
2667 if (!type->defaultAtts)
|
|
2668 return 0;
|
|
2669 }
|
|
2670 att = type->defaultAtts + type->nDefaultAtts;
|
|
2671 att->id = attId;
|
|
2672 att->value = value;
|
|
2673 att->isCdata = isCdata;
|
|
2674 if (!isCdata)
|
|
2675 attId->maybeTokenized = 1;
|
|
2676 type->nDefaultAtts += 1;
|
|
2677 return 1;
|
|
2678 }
|
|
2679
|
|
2680 static int setElementTypePrefix(XML_Parser parser, ELEMENT_TYPE *elementType)
|
|
2681 {
|
|
2682 const XML_Char *name;
|
|
2683 for (name = elementType->name; *name; name++) {
|
|
2684 if (*name == XML_T(':')) {
|
|
2685 PREFIX *prefix;
|
|
2686 const XML_Char *s;
|
|
2687 for (s = elementType->name; s != name; s++) {
|
|
2688 if (!poolAppendChar(&dtd.pool, *s))
|
|
2689 return 0;
|
|
2690 }
|
|
2691 if (!poolAppendChar(&dtd.pool, XML_T('\0')))
|
|
2692 return 0;
|
|
2693 prefix = (PREFIX *)lookup(&dtd.prefixes, poolStart(&dtd.pool), sizeof(PREFIX));
|
|
2694 if (!prefix)
|
|
2695 return 0;
|
|
2696 if (prefix->name == poolStart(&dtd.pool))
|
|
2697 poolFinish(&dtd.pool);
|
|
2698 else
|
|
2699 poolDiscard(&dtd.pool);
|
|
2700 elementType->prefix = prefix;
|
|
2701
|
|
2702 }
|
|
2703 }
|
|
2704 return 1;
|
|
2705 }
|
|
2706
|
|
2707 static ATTRIBUTE_ID *
|
|
2708 getAttributeId(XML_Parser parser, const ENCODING *enc, const char *start, const char *end)
|
|
2709 {
|
|
2710 ATTRIBUTE_ID *id;
|
|
2711 const XML_Char *name;
|
|
2712 if (!poolAppendChar(&dtd.pool, XML_T('\0')))
|
|
2713 return 0;
|
|
2714 name = poolStoreString(&dtd.pool, enc, start, end);
|
|
2715 if (!name)
|
|
2716 return 0;
|
|
2717 ++name;
|
|
2718 id = (ATTRIBUTE_ID *)lookup(&dtd.attributeIds, name, sizeof(ATTRIBUTE_ID));
|
|
2719 if (!id)
|
|
2720 return 0;
|
|
2721 if (id->name != name)
|
|
2722 poolDiscard(&dtd.pool);
|
|
2723 else {
|
|
2724 poolFinish(&dtd.pool);
|
|
2725 if (!ns)
|
|
2726 ;
|
|
2727 else if (name[0] == 'x'
|
|
2728 && name[1] == 'm'
|
|
2729 && name[2] == 'l'
|
|
2730 && name[3] == 'n'
|
|
2731 && name[4] == 's'
|
|
2732 && (name[5] == XML_T('\0') || name[5] == XML_T(':'))) {
|
|
2733 if (name[5] == '\0')
|
|
2734 id->prefix = &dtd.defaultPrefix;
|
|
2735 else
|
|
2736 id->prefix = (PREFIX *)lookup(&dtd.prefixes, name + 6, sizeof(PREFIX));
|
|
2737 id->xmlns = 1;
|
|
2738 }
|
|
2739 else {
|
|
2740 int i;
|
|
2741 for (i = 0; name[i]; i++) {
|
|
2742 if (name[i] == XML_T(':')) {
|
|
2743 int j;
|
|
2744 for (j = 0; j < i; j++) {
|
|
2745 if (!poolAppendChar(&dtd.pool, name[j]))
|
|
2746 return 0;
|
|
2747 }
|
|
2748 if (!poolAppendChar(&dtd.pool, XML_T('\0')))
|
|
2749 return 0;
|
|
2750 id->prefix = (PREFIX *)lookup(&dtd.prefixes, poolStart(&dtd.pool), sizeof(PREFIX));
|
|
2751 if (id->prefix->name == poolStart(&dtd.pool))
|
|
2752 poolFinish(&dtd.pool);
|
|
2753 else
|
|
2754 poolDiscard(&dtd.pool);
|
|
2755 break;
|
|
2756 }
|
|
2757 }
|
|
2758 }
|
|
2759 }
|
|
2760 return id;
|
|
2761 }
|
|
2762
|
|
2763 #define CONTEXT_SEP XML_T('\f')
|
|
2764
|
|
2765 static
|
|
2766 const XML_Char *getContext(XML_Parser parser)
|
|
2767 {
|
|
2768 HASH_TABLE_ITER iter;
|
|
2769 int needSep = 0;
|
|
2770
|
|
2771 if (dtd.defaultPrefix.binding) {
|
|
2772 int i;
|
|
2773 int len;
|
|
2774 if (!poolAppendChar(&tempPool, XML_T('=')))
|
|
2775 return 0;
|
|
2776 len = dtd.defaultPrefix.binding->uriLen;
|
|
2777 if (namespaceSeparator != XML_T('\0'))
|
|
2778 len--;
|
|
2779 for (i = 0; i < len; i++)
|
|
2780 if (!poolAppendChar(&tempPool, dtd.defaultPrefix.binding->uri[i]))
|
|
2781 return 0;
|
|
2782 needSep = 1;
|
|
2783 }
|
|
2784
|
|
2785 hashTableIterInit(&iter, &(dtd.prefixes));
|
|
2786 for (;;) {
|
|
2787 int i;
|
|
2788 int len;
|
|
2789 const XML_Char *s;
|
|
2790 PREFIX *prefix = (PREFIX *)hashTableIterNext(&iter);
|
|
2791 if (!prefix)
|
|
2792 break;
|
|
2793 if (!prefix->binding)
|
|
2794 continue;
|
|
2795 if (needSep && !poolAppendChar(&tempPool, CONTEXT_SEP))
|
|
2796 return 0;
|
|
2797 for (s = prefix->name; *s; s++)
|
|
2798 if (!poolAppendChar(&tempPool, *s))
|
|
2799 return 0;
|
|
2800 if (!poolAppendChar(&tempPool, XML_T('=')))
|
|
2801 return 0;
|
|
2802 len = prefix->binding->uriLen;
|
|
2803 if (namespaceSeparator != XML_T('\0'))
|
|
2804 len--;
|
|
2805 for (i = 0; i < len; i++)
|
|
2806 if (!poolAppendChar(&tempPool, prefix->binding->uri[i]))
|
|
2807 return 0;
|
|
2808 needSep = 1;
|
|
2809 }
|
|
2810
|
|
2811
|
|
2812 hashTableIterInit(&iter, &(dtd.generalEntities));
|
|
2813 for (;;) {
|
|
2814 const XML_Char *s;
|
|
2815 ENTITY *e = (ENTITY *)hashTableIterNext(&iter);
|
|
2816 if (!e)
|
|
2817 break;
|
|
2818 if (!e->open)
|
|
2819 continue;
|
|
2820 if (needSep && !poolAppendChar(&tempPool, CONTEXT_SEP))
|
|
2821 return 0;
|
|
2822 for (s = e->name; *s; s++)
|
|
2823 if (!poolAppendChar(&tempPool, *s))
|
|
2824 return 0;
|
|
2825 needSep = 1;
|
|
2826 }
|
|
2827
|
|
2828 if (!poolAppendChar(&tempPool, XML_T('\0')))
|
|
2829 return 0;
|
|
2830 return tempPool.start;
|
|
2831 }
|
|
2832
|
|
2833 static
|
|
2834 int setContext(XML_Parser parser, const XML_Char *context)
|
|
2835 {
|
|
2836 const XML_Char *s = context;
|
|
2837
|
|
2838 while (*context != XML_T('\0')) {
|
|
2839 if (*s == CONTEXT_SEP || *s == XML_T('\0')) {
|
|
2840 ENTITY *e;
|
|
2841 if (!poolAppendChar(&tempPool, XML_T('\0')))
|
|
2842 return 0;
|
|
2843 e = (ENTITY *)lookup(&dtd.generalEntities, poolStart(&tempPool), 0);
|
|
2844 if (e)
|
|
2845 e->open = 1;
|
|
2846 if (*s != XML_T('\0'))
|
|
2847 s++;
|
|
2848 context = s;
|
|
2849 poolDiscard(&tempPool);
|
|
2850 }
|
|
2851 else if (*s == '=') {
|
|
2852 PREFIX *prefix;
|
|
2853 if (poolLength(&tempPool) == 0)
|
|
2854 prefix = &dtd.defaultPrefix;
|
|
2855 else {
|
|
2856 if (!poolAppendChar(&tempPool, XML_T('\0')))
|
|
2857 return 0;
|
|
2858 prefix = (PREFIX *)lookup(&dtd.prefixes, poolStart(&tempPool), sizeof(PREFIX));
|
|
2859 if (!prefix)
|
|
2860 return 0;
|
|
2861 if (prefix->name == poolStart(&tempPool))
|
|
2862 poolFinish(&tempPool);
|
|
2863 else
|
|
2864 poolDiscard(&tempPool);
|
|
2865 }
|
|
2866 for (context = s + 1; *context != CONTEXT_SEP && *context != XML_T('\0'); context++)
|
|
2867 if (!poolAppendChar(&tempPool, *context))
|
|
2868 return 0;
|
|
2869 if (!poolAppendChar(&tempPool, XML_T('\0')))
|
|
2870 return 0;
|
|
2871 if (!addBinding(parser, prefix, 0, poolStart(&tempPool), &inheritedBindings))
|
|
2872 return 0;
|
|
2873 poolDiscard(&tempPool);
|
|
2874 if (*context != XML_T('\0'))
|
|
2875 ++context;
|
|
2876 s = context;
|
|
2877 }
|
|
2878 else {
|
|
2879 if (!poolAppendChar(&tempPool, *s))
|
|
2880 return 0;
|
|
2881 s++;
|
|
2882 }
|
|
2883 }
|
|
2884 return 1;
|
|
2885 }
|
|
2886
|
|
2887
|
|
2888 static
|
|
2889 void normalizePublicId(XML_Char *publicId)
|
|
2890 {
|
|
2891 XML_Char *p = publicId;
|
|
2892 XML_Char *s;
|
|
2893 for (s = publicId; *s; s++) {
|
|
2894 switch (*s) {
|
|
2895 case 0x20:
|
|
2896 case 0xD:
|
|
2897 case 0xA:
|
|
2898 if (p != publicId && p[-1] != 0x20)
|
|
2899 *p++ = 0x20;
|
|
2900 break;
|
|
2901 default:
|
|
2902 *p++ = *s;
|
|
2903 }
|
|
2904 }
|
|
2905 if (p != publicId && p[-1] == 0x20)
|
|
2906 --p;
|
|
2907 *p = XML_T('\0');
|
|
2908 }
|
|
2909
|
|
2910 static int dtdInit(DTD *p)
|
|
2911 {
|
|
2912 poolInit(&(p->pool));
|
|
2913 hashTableInit(&(p->generalEntities));
|
|
2914 hashTableInit(&(p->elementTypes));
|
|
2915 hashTableInit(&(p->attributeIds));
|
|
2916 hashTableInit(&(p->prefixes));
|
|
2917 p->complete = 1;
|
|
2918 p->standalone = 0;
|
|
2919 p->base = 0;
|
|
2920 p->defaultPrefix.name = 0;
|
|
2921 p->defaultPrefix.binding = 0;
|
|
2922 return 1;
|
|
2923 }
|
|
2924
|
|
2925 static void dtdDestroy(DTD *p)
|
|
2926 {
|
|
2927 HASH_TABLE_ITER iter;
|
|
2928 hashTableIterInit(&iter, &(p->elementTypes));
|
|
2929 for (;;) {
|
|
2930 ELEMENT_TYPE *e = (ELEMENT_TYPE *)hashTableIterNext(&iter);
|
|
2931 if (!e)
|
|
2932 break;
|
|
2933 if (e->allocDefaultAtts != 0)
|
|
2934 free(e->defaultAtts);
|
|
2935 }
|
|
2936 hashTableDestroy(&(p->generalEntities));
|
|
2937 hashTableDestroy(&(p->elementTypes));
|
|
2938 hashTableDestroy(&(p->attributeIds));
|
|
2939 hashTableDestroy(&(p->prefixes));
|
|
2940 poolDestroy(&(p->pool));
|
|
2941 }
|
|
2942
|
|
2943 /* Do a deep copy of the DTD. Return 0 for out of memory; non-zero otherwise.
|
|
2944 The new DTD has already been initialized. */
|
|
2945
|
|
2946 static int dtdCopy(DTD *newDtd, const DTD *oldDtd)
|
|
2947 {
|
|
2948 HASH_TABLE_ITER iter;
|
|
2949
|
|
2950 if (oldDtd->base) {
|
|
2951 const XML_Char *tem = poolCopyString(&(newDtd->pool), oldDtd->base);
|
|
2952 if (!tem)
|
|
2953 return 0;
|
|
2954 newDtd->base = tem;
|
|
2955 }
|
|
2956
|
|
2957 /* Copy the prefix table. */
|
|
2958
|
|
2959 hashTableIterInit(&iter, &(oldDtd->prefixes));
|
|
2960 for (;;) {
|
|
2961 const XML_Char *name;
|
|
2962 const PREFIX *oldP = (PREFIX *)hashTableIterNext(&iter);
|
|
2963 if (!oldP)
|
|
2964 break;
|
|
2965 name = poolCopyString(&(newDtd->pool), oldP->name);
|
|
2966 if (!name)
|
|
2967 return 0;
|
|
2968 if (!lookup(&(newDtd->prefixes), name, sizeof(PREFIX)))
|
|
2969 return 0;
|
|
2970 }
|
|
2971
|
|
2972 hashTableIterInit(&iter, &(oldDtd->attributeIds));
|
|
2973
|
|
2974 /* Copy the attribute id table. */
|
|
2975
|
|
2976 for (;;) {
|
|
2977 ATTRIBUTE_ID *newA;
|
|
2978 const XML_Char *name;
|
|
2979 const ATTRIBUTE_ID *oldA = (ATTRIBUTE_ID *)hashTableIterNext(&iter);
|
|
2980
|
|
2981 if (!oldA)
|
|
2982 break;
|
|
2983 /* Remember to allocate the scratch byte before the name. */
|
|
2984 if (!poolAppendChar(&(newDtd->pool), XML_T('\0')))
|
|
2985 return 0;
|
|
2986 name = poolCopyString(&(newDtd->pool), oldA->name);
|
|
2987 if (!name)
|
|
2988 return 0;
|
|
2989 ++name;
|
|
2990 newA = (ATTRIBUTE_ID *)lookup(&(newDtd->attributeIds), name, sizeof(ATTRIBUTE_ID));
|
|
2991 if (!newA)
|
|
2992 return 0;
|
|
2993 newA->maybeTokenized = oldA->maybeTokenized;
|
|
2994 if (oldA->prefix) {
|
|
2995 newA->xmlns = oldA->xmlns;
|
|
2996 if (oldA->prefix == &oldDtd->defaultPrefix)
|
|
2997 newA->prefix = &newDtd->defaultPrefix;
|
|
2998 else
|
|
2999 newA->prefix = (PREFIX *)lookup(&(newDtd->prefixes), oldA->prefix->name, 0);
|
|
3000 }
|
|
3001 }
|
|
3002
|
|
3003 /* Copy the element type table. */
|
|
3004
|
|
3005 hashTableIterInit(&iter, &(oldDtd->elementTypes));
|
|
3006
|
|
3007 for (;;) {
|
|
3008 int i;
|
|
3009 ELEMENT_TYPE *newE;
|
|
3010 const XML_Char *name;
|
|
3011 const ELEMENT_TYPE *oldE = (ELEMENT_TYPE *)hashTableIterNext(&iter);
|
|
3012 if (!oldE)
|
|
3013 break;
|
|
3014 name = poolCopyString(&(newDtd->pool), oldE->name);
|
|
3015 if (!name)
|
|
3016 return 0;
|
|
3017 newE = (ELEMENT_TYPE *)lookup(&(newDtd->elementTypes), name, sizeof(ELEMENT_TYPE));
|
|
3018 if (!newE)
|
|
3019 return 0;
|
|
3020 if (oldE->nDefaultAtts) {
|
|
3021 newE->defaultAtts = (DEFAULT_ATTRIBUTE *)malloc(oldE->nDefaultAtts * sizeof(DEFAULT_ATTRIBUTE));
|
|
3022 if (!newE->defaultAtts)
|
|
3023 return 0;
|
|
3024 }
|
|
3025 newE->allocDefaultAtts = newE->nDefaultAtts = oldE->nDefaultAtts;
|
|
3026 if (oldE->prefix)
|
|
3027 newE->prefix = (PREFIX *)lookup(&(newDtd->prefixes), oldE->prefix->name, 0);
|
|
3028 for (i = 0; i < newE->nDefaultAtts; i++) {
|
|
3029 newE->defaultAtts[i].id = (ATTRIBUTE_ID *)lookup(&(newDtd->attributeIds), oldE->defaultAtts[i].id->name, 0);
|
|
3030 newE->defaultAtts[i].isCdata = oldE->defaultAtts[i].isCdata;
|
|
3031 if (oldE->defaultAtts[i].value) {
|
|
3032 newE->defaultAtts[i].value = poolCopyString(&(newDtd->pool), oldE->defaultAtts[i].value);
|
|
3033 if (!newE->defaultAtts[i].value)
|
|
3034 return 0;
|
|
3035 }
|
|
3036 else
|
|
3037 newE->defaultAtts[i].value = 0;
|
|
3038 }
|
|
3039 }
|
|
3040
|
|
3041 /* Copy the entity table. */
|
|
3042
|
|
3043 hashTableIterInit(&iter, &(oldDtd->generalEntities));
|
|
3044
|
|
3045 for (;;) {
|
|
3046 ENTITY *newE;
|
|
3047 const XML_Char *name;
|
|
3048 const ENTITY *oldE = (ENTITY *)hashTableIterNext(&iter);
|
|
3049 if (!oldE)
|
|
3050 break;
|
|
3051 name = poolCopyString(&(newDtd->pool), oldE->name);
|
|
3052 if (!name)
|
|
3053 return 0;
|
|
3054 newE = (ENTITY *)lookup(&(newDtd->generalEntities), name, sizeof(ENTITY));
|
|
3055 if (!newE)
|
|
3056 return 0;
|
|
3057 if (oldE->systemId) {
|
|
3058 const XML_Char *tem = poolCopyString(&(newDtd->pool), oldE->systemId);
|
|
3059 if (!tem)
|
|
3060 return 0;
|
|
3061 newE->systemId = tem;
|
|
3062 if (oldE->base) {
|
|
3063 if (oldE->base == oldDtd->base)
|
|
3064 newE->base = newDtd->base;
|
|
3065 tem = poolCopyString(&(newDtd->pool), oldE->base);
|
|
3066 if (!tem)
|
|
3067 return 0;
|
|
3068 newE->base = tem;
|
|
3069 }
|
|
3070 }
|
|
3071 else {
|
|
3072 const XML_Char *tem = poolCopyStringN(&(newDtd->pool), oldE->textPtr, oldE->textLen);
|
|
3073 if (!tem)
|
|
3074 return 0;
|
|
3075 newE->textPtr = tem;
|
|
3076 newE->textLen = oldE->textLen;
|
|
3077 }
|
|
3078 if (oldE->notation) {
|
|
3079 const XML_Char *tem = poolCopyString(&(newDtd->pool), oldE->notation);
|
|
3080 if (!tem)
|
|
3081 return 0;
|
|
3082 newE->notation = tem;
|
|
3083 }
|
|
3084 }
|
|
3085
|
|
3086 newDtd->complete = oldDtd->complete;
|
|
3087 newDtd->standalone = oldDtd->standalone;
|
|
3088 return 1;
|
|
3089 }
|
|
3090
|
|
3091 static
|
|
3092 void poolInit(STRING_POOL *pool)
|
|
3093 {
|
|
3094 pool->blocks = 0;
|
|
3095 pool->freeBlocks = 0;
|
|
3096 pool->start = 0;
|
|
3097 pool->ptr = 0;
|
|
3098 pool->end = 0;
|
|
3099 }
|
|
3100
|
|
3101 static
|
|
3102 void poolClear(STRING_POOL *pool)
|
|
3103 {
|
|
3104 if (!pool->freeBlocks)
|
|
3105 pool->freeBlocks = pool->blocks;
|
|
3106 else {
|
|
3107 BLOCK *p = pool->blocks;
|
|
3108 while (p) {
|
|
3109 BLOCK *tem = p->next;
|
|
3110 p->next = pool->freeBlocks;
|
|
3111 pool->freeBlocks = p;
|
|
3112 p = tem;
|
|
3113 }
|
|
3114 }
|
|
3115 pool->blocks = 0;
|
|
3116 pool->start = 0;
|
|
3117 pool->ptr = 0;
|
|
3118 pool->end = 0;
|
|
3119 }
|
|
3120
|
|
3121 static
|
|
3122 void poolDestroy(STRING_POOL *pool)
|
|
3123 {
|
|
3124 BLOCK *p = pool->blocks;
|
|
3125 while (p) {
|
|
3126 BLOCK *tem = p->next;
|
|
3127 free(p);
|
|
3128 p = tem;
|
|
3129 }
|
|
3130 pool->blocks = 0;
|
|
3131 p = pool->freeBlocks;
|
|
3132 while (p) {
|
|
3133 BLOCK *tem = p->next;
|
|
3134 free(p);
|
|
3135 p = tem;
|
|
3136 }
|
|
3137 pool->freeBlocks = 0;
|
|
3138 pool->ptr = 0;
|
|
3139 pool->start = 0;
|
|
3140 pool->end = 0;
|
|
3141 }
|
|
3142
|
|
3143 static
|
|
3144 XML_Char *poolAppend(STRING_POOL *pool, const ENCODING *enc,
|
|
3145 const char *ptr, const char *end)
|
|
3146 {
|
|
3147 if (!pool->ptr && !poolGrow(pool))
|
|
3148 return 0;
|
|
3149 for (;;) {
|
|
3150 XmlConvert(enc, &ptr, end, (ICHAR **)&(pool->ptr), (ICHAR *)pool->end);
|
|
3151 if (ptr == end)
|
|
3152 break;
|
|
3153 if (!poolGrow(pool))
|
|
3154 return 0;
|
|
3155 }
|
|
3156 return pool->start;
|
|
3157 }
|
|
3158
|
|
3159 static const XML_Char *poolCopyString(STRING_POOL *pool, const XML_Char *s)
|
|
3160 {
|
|
3161 do {
|
|
3162 if (!poolAppendChar(pool, *s))
|
|
3163 return 0;
|
|
3164 } while (*s++);
|
|
3165 s = pool->start;
|
|
3166 poolFinish(pool);
|
|
3167 return s;
|
|
3168 }
|
|
3169
|
|
3170 static const XML_Char *poolCopyStringN(STRING_POOL *pool, const XML_Char *s, int n)
|
|
3171 {
|
|
3172 if (!pool->ptr && !poolGrow(pool))
|
|
3173 return 0;
|
|
3174 for (; n > 0; --n, s++) {
|
|
3175 if (!poolAppendChar(pool, *s))
|
|
3176 return 0;
|
|
3177
|
|
3178 }
|
|
3179 s = pool->start;
|
|
3180 poolFinish(pool);
|
|
3181 return s;
|
|
3182 }
|
|
3183
|
|
3184 static
|
|
3185 XML_Char *poolStoreString(STRING_POOL *pool, const ENCODING *enc,
|
|
3186 const char *ptr, const char *end)
|
|
3187 {
|
|
3188 if (!poolAppend(pool, enc, ptr, end))
|
|
3189 return 0;
|
|
3190 if (pool->ptr == pool->end && !poolGrow(pool))
|
|
3191 return 0;
|
|
3192 *(pool->ptr)++ = 0;
|
|
3193 return pool->start;
|
|
3194 }
|
|
3195
|
|
3196 static
|
|
3197 int poolGrow(STRING_POOL *pool)
|
|
3198 {
|
|
3199 if (pool->freeBlocks) {
|
|
3200 if (pool->start == 0) {
|
|
3201 pool->blocks = pool->freeBlocks;
|
|
3202 pool->freeBlocks = pool->freeBlocks->next;
|
|
3203 pool->blocks->next = 0;
|
|
3204 pool->start = pool->blocks->s;
|
|
3205 pool->end = pool->start + pool->blocks->size;
|
|
3206 pool->ptr = pool->start;
|
|
3207 return 1;
|
|
3208 }
|
|
3209 if (pool->end - pool->start < pool->freeBlocks->size) {
|
|
3210 BLOCK *tem = pool->freeBlocks->next;
|
|
3211 pool->freeBlocks->next = pool->blocks;
|
|
3212 pool->blocks = pool->freeBlocks;
|
|
3213 pool->freeBlocks = tem;
|
|
3214 memcpy(pool->blocks->s, pool->start, (pool->end - pool->start) * sizeof(XML_Char));
|
|
3215 pool->ptr = pool->blocks->s + (pool->ptr - pool->start);
|
|
3216 pool->start = pool->blocks->s;
|
|
3217 pool->end = pool->start + pool->blocks->size;
|
|
3218 return 1;
|
|
3219 }
|
|
3220 }
|
|
3221 if (pool->blocks && pool->start == pool->blocks->s) {
|
|
3222 int blockSize = (pool->end - pool->start)*2;
|
|
3223 pool->blocks = realloc(pool->blocks, offsetof(BLOCK, s) + blockSize * sizeof(XML_Char));
|
|
3224 if (!pool->blocks)
|
|
3225 return 0;
|
|
3226 pool->blocks->size = blockSize;
|
|
3227 pool->ptr = pool->blocks->s + (pool->ptr - pool->start);
|
|
3228 pool->start = pool->blocks->s;
|
|
3229 pool->end = pool->start + blockSize;
|
|
3230 }
|
|
3231 else {
|
|
3232 BLOCK *tem;
|
|
3233 int blockSize = pool->end - pool->start;
|
|
3234 if (blockSize < INIT_BLOCK_SIZE)
|
|
3235 blockSize = INIT_BLOCK_SIZE;
|
|
3236 else
|
|
3237 blockSize *= 2;
|
|
3238 tem = malloc(offsetof(BLOCK, s) + blockSize * sizeof(XML_Char));
|
|
3239 if (!tem)
|
|
3240 return 0;
|
|
3241 tem->size = blockSize;
|
|
3242 tem->next = pool->blocks;
|
|
3243 pool->blocks = tem;
|
|
3244 memcpy(tem->s, pool->start, (pool->ptr - pool->start) * sizeof(XML_Char));
|
|
3245 pool->ptr = tem->s + (pool->ptr - pool->start);
|
|
3246 pool->start = tem->s;
|
|
3247 pool->end = tem->s + blockSize;
|
|
3248 }
|
|
3249 return 1;
|
|
3250 }
|