1/*
2 * SAX2.c : Default SAX2 handler to build a tree.
3 *
4 * See Copyright for the status of this software.
5 *
6 * Daniel Veillard <daniel@veillard.com>
7 */
8
9
10#define IN_LIBXML
11#include "libxml.h"
12#include <stdlib.h>
13#include <string.h>
14#include <limits.h>
15#include <libxml/xmlmemory.h>
16#include <libxml/tree.h>
17#include <libxml/parser.h>
18#include <libxml/parserInternals.h>
19#include <libxml/valid.h>
20#include <libxml/entities.h>
21#include <libxml/xmlerror.h>
22#include <libxml/debugXML.h>
23#include <libxml/xmlIO.h>
24#include <libxml/SAX.h>
25#include <libxml/uri.h>
26#include <libxml/valid.h>
27#include <libxml/HTMLtree.h>
28#include <libxml/globals.h>
29
30/* Define SIZE_T_MAX unless defined through <limits.h>. */
31#ifndef SIZE_T_MAX
32# define SIZE_T_MAX     ((size_t)-1)
33#endif /* !SIZE_T_MAX */
34
35/* #define DEBUG_SAX2 */
36/* #define DEBUG_SAX2_TREE */
37
38/**
39 * TODO:
40 *
41 * macro to flag unimplemented blocks
42 * XML_CATALOG_PREFER user env to select between system/public prefered
43 * option. C.f. Richard Tobin <richard@cogsci.ed.ac.uk>
44 *> Just FYI, I am using an environment variable XML_CATALOG_PREFER with
45 *> values "system" and "public".  I have made the default be "system" to
46 *> match yours.
47 */
48#define TODO								\
49    xmlGenericError(xmlGenericErrorContext,				\
50	    "Unimplemented block at %s:%d\n",				\
51            __FILE__, __LINE__);
52
53/*
54 * xmlSAX2ErrMemory:
55 * @ctxt:  an XML validation parser context
56 * @msg:   a string to accompany the error message
57 */
58static void
59xmlSAX2ErrMemory(xmlParserCtxtPtr ctxt, const char *msg) {
60    xmlStructuredErrorFunc schannel = NULL;
61    const char *str1 = "out of memory\n";
62
63    if (ctxt != NULL) {
64	ctxt->errNo = XML_ERR_NO_MEMORY;
65	if ((ctxt->sax != NULL) && (ctxt->sax->initialized == XML_SAX2_MAGIC))
66	    schannel = ctxt->sax->serror;
67	__xmlRaiseError(schannel,
68			ctxt->vctxt.error, ctxt->vctxt.userData,
69			ctxt, NULL, XML_FROM_PARSER, XML_ERR_NO_MEMORY,
70			XML_ERR_ERROR, NULL, 0, (const char *) str1,
71			NULL, NULL, 0, 0,
72			msg, (const char *) str1, NULL);
73	ctxt->errNo = XML_ERR_NO_MEMORY;
74	ctxt->instate = XML_PARSER_EOF;
75	ctxt->disableSAX = 1;
76    } else {
77	__xmlRaiseError(schannel,
78			NULL, NULL,
79			ctxt, NULL, XML_FROM_PARSER, XML_ERR_NO_MEMORY,
80			XML_ERR_ERROR, NULL, 0, (const char *) str1,
81			NULL, NULL, 0, 0,
82			msg, (const char *) str1, NULL);
83    }
84}
85
86/**
87 * xmlValidError:
88 * @ctxt:  an XML validation parser context
89 * @error:  the error number
90 * @msg:  the error message
91 * @str1:  extra data
92 * @str2:  extra data
93 *
94 * Handle a validation error
95 */
96static void
97xmlErrValid(xmlParserCtxtPtr ctxt, xmlParserErrors error,
98            const char *msg, const char *str1, const char *str2)
99{
100    xmlStructuredErrorFunc schannel = NULL;
101
102    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
103        (ctxt->instate == XML_PARSER_EOF))
104	return;
105    if (ctxt != NULL) {
106	ctxt->errNo = error;
107	if ((ctxt->sax != NULL) && (ctxt->sax->initialized == XML_SAX2_MAGIC))
108	    schannel = ctxt->sax->serror;
109	__xmlRaiseError(schannel,
110			ctxt->vctxt.error, ctxt->vctxt.userData,
111			ctxt, NULL, XML_FROM_DTD, error,
112			XML_ERR_ERROR, NULL, 0, (const char *) str1,
113			(const char *) str2, NULL, 0, 0,
114			msg, (const char *) str1, (const char *) str2);
115	ctxt->valid = 0;
116    } else {
117	__xmlRaiseError(schannel,
118			NULL, NULL,
119			ctxt, NULL, XML_FROM_DTD, error,
120			XML_ERR_ERROR, NULL, 0, (const char *) str1,
121			(const char *) str2, NULL, 0, 0,
122			msg, (const char *) str1, (const char *) str2);
123    }
124}
125
126/**
127 * xmlFatalErrMsg:
128 * @ctxt:  an XML parser context
129 * @error:  the error number
130 * @msg:  the error message
131 * @str1:  an error string
132 * @str2:  an error string
133 *
134 * Handle a fatal parser error, i.e. violating Well-Formedness constraints
135 */
136static void
137xmlFatalErrMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
138               const char *msg, const xmlChar *str1, const xmlChar *str2)
139{
140    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
141        (ctxt->instate == XML_PARSER_EOF))
142	return;
143    if (ctxt != NULL)
144	ctxt->errNo = error;
145    __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER, error,
146                    XML_ERR_FATAL, NULL, 0,
147		    (const char *) str1, (const char *) str2,
148		    NULL, 0, 0, msg, str1, str2);
149    if (ctxt != NULL) {
150	ctxt->wellFormed = 0;
151	ctxt->valid = 0;
152	if (ctxt->recovery == 0)
153	    ctxt->disableSAX = 1;
154    }
155}
156
157/**
158 * xmlWarnMsg:
159 * @ctxt:  an XML parser context
160 * @error:  the error number
161 * @msg:  the error message
162 * @str1:  an error string
163 * @str2:  an error string
164 *
165 * Handle a parser warning
166 */
167static void
168xmlWarnMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
169               const char *msg, const xmlChar *str1)
170{
171    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
172        (ctxt->instate == XML_PARSER_EOF))
173	return;
174    if (ctxt != NULL)
175	ctxt->errNo = error;
176    __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER, error,
177                    XML_ERR_WARNING, NULL, 0,
178		    (const char *) str1, NULL,
179		    NULL, 0, 0, msg, str1);
180}
181
182/**
183 * xmlNsErrMsg:
184 * @ctxt:  an XML parser context
185 * @error:  the error number
186 * @msg:  the error message
187 * @str1:  an error string
188 * @str2:  an error string
189 *
190 * Handle a namespace error
191 */
192static void
193xmlNsErrMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
194            const char *msg, const xmlChar *str1, const xmlChar *str2)
195{
196    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
197        (ctxt->instate == XML_PARSER_EOF))
198	return;
199    if (ctxt != NULL)
200	ctxt->errNo = error;
201    __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_NAMESPACE, error,
202                    XML_ERR_ERROR, NULL, 0,
203		    (const char *) str1, (const char *) str2,
204		    NULL, 0, 0, msg, str1, str2);
205}
206
207/**
208 * xmlNsWarnMsg:
209 * @ctxt:  an XML parser context
210 * @error:  the error number
211 * @msg:  the error message
212 * @str1:  an error string
213 *
214 * Handle a namespace warning
215 */
216static void
217xmlNsWarnMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
218             const char *msg, const xmlChar *str1, const xmlChar *str2)
219{
220    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
221        (ctxt->instate == XML_PARSER_EOF))
222	return;
223    if (ctxt != NULL)
224	ctxt->errNo = error;
225    __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_NAMESPACE, error,
226                    XML_ERR_WARNING, NULL, 0,
227		    (const char *) str1, (const char *) str2,
228		    NULL, 0, 0, msg, str1, str2);
229}
230
231/**
232 * xmlSAX2GetPublicId:
233 * @ctx: the user data (XML parser context)
234 *
235 * Provides the public ID e.g. "-//SGMLSOURCE//DTD DEMO//EN"
236 *
237 * Returns a xmlChar *
238 */
239const xmlChar *
240xmlSAX2GetPublicId(void *ctx ATTRIBUTE_UNUSED)
241{
242    /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
243    return(NULL);
244}
245
246/**
247 * xmlSAX2GetSystemId:
248 * @ctx: the user data (XML parser context)
249 *
250 * Provides the system ID, basically URL or filename e.g.
251 * http://www.sgmlsource.com/dtds/memo.dtd
252 *
253 * Returns a xmlChar *
254 */
255const xmlChar *
256xmlSAX2GetSystemId(void *ctx)
257{
258    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
259    if ((ctx == NULL) || (ctxt->input == NULL)) return(NULL);
260    return((const xmlChar *) ctxt->input->filename);
261}
262
263/**
264 * xmlSAX2GetLineNumber:
265 * @ctx: the user data (XML parser context)
266 *
267 * Provide the line number of the current parsing point.
268 *
269 * Returns an int
270 */
271int
272xmlSAX2GetLineNumber(void *ctx)
273{
274    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
275    if ((ctx == NULL) || (ctxt->input == NULL)) return(0);
276    return(ctxt->input->line);
277}
278
279/**
280 * xmlSAX2GetColumnNumber:
281 * @ctx: the user data (XML parser context)
282 *
283 * Provide the column number of the current parsing point.
284 *
285 * Returns an int
286 */
287int
288xmlSAX2GetColumnNumber(void *ctx)
289{
290    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
291    if ((ctx == NULL) || (ctxt->input == NULL)) return(0);
292    return(ctxt->input->col);
293}
294
295/**
296 * xmlSAX2IsStandalone:
297 * @ctx: the user data (XML parser context)
298 *
299 * Is this document tagged standalone ?
300 *
301 * Returns 1 if true
302 */
303int
304xmlSAX2IsStandalone(void *ctx)
305{
306    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
307    if ((ctx == NULL) || (ctxt->myDoc == NULL)) return(0);
308    return(ctxt->myDoc->standalone == 1);
309}
310
311/**
312 * xmlSAX2HasInternalSubset:
313 * @ctx: the user data (XML parser context)
314 *
315 * Does this document has an internal subset
316 *
317 * Returns 1 if true
318 */
319int
320xmlSAX2HasInternalSubset(void *ctx)
321{
322    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
323    if ((ctxt == NULL) || (ctxt->myDoc == NULL)) return(0);
324    return(ctxt->myDoc->intSubset != NULL);
325}
326
327/**
328 * xmlSAX2HasExternalSubset:
329 * @ctx: the user data (XML parser context)
330 *
331 * Does this document has an external subset
332 *
333 * Returns 1 if true
334 */
335int
336xmlSAX2HasExternalSubset(void *ctx)
337{
338    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
339    if ((ctxt == NULL) || (ctxt->myDoc == NULL)) return(0);
340    return(ctxt->myDoc->extSubset != NULL);
341}
342
343/**
344 * xmlSAX2InternalSubset:
345 * @ctx:  the user data (XML parser context)
346 * @name:  the root element name
347 * @ExternalID:  the external ID
348 * @SystemID:  the SYSTEM ID (e.g. filename or URL)
349 *
350 * Callback on internal subset declaration.
351 */
352void
353xmlSAX2InternalSubset(void *ctx, const xmlChar *name,
354	       const xmlChar *ExternalID, const xmlChar *SystemID)
355{
356    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
357    xmlDtdPtr dtd;
358    if (ctx == NULL) return;
359#ifdef DEBUG_SAX
360    xmlGenericError(xmlGenericErrorContext,
361	    "SAX.xmlSAX2InternalSubset(%s, %s, %s)\n",
362            name, ExternalID, SystemID);
363#endif
364
365    if (ctxt->myDoc == NULL)
366	return;
367    dtd = xmlGetIntSubset(ctxt->myDoc);
368    if (dtd != NULL) {
369	if (ctxt->html)
370	    return;
371	xmlUnlinkNode((xmlNodePtr) dtd);
372	xmlFreeDtd(dtd);
373	ctxt->myDoc->intSubset = NULL;
374    }
375    ctxt->myDoc->intSubset =
376	xmlCreateIntSubset(ctxt->myDoc, name, ExternalID, SystemID);
377    if (ctxt->myDoc->intSubset == NULL)
378        xmlSAX2ErrMemory(ctxt, "xmlSAX2InternalSubset");
379}
380
381/**
382 * xmlSAX2ExternalSubset:
383 * @ctx: the user data (XML parser context)
384 * @name:  the root element name
385 * @ExternalID:  the external ID
386 * @SystemID:  the SYSTEM ID (e.g. filename or URL)
387 *
388 * Callback on external subset declaration.
389 */
390void
391xmlSAX2ExternalSubset(void *ctx, const xmlChar *name,
392	       const xmlChar *ExternalID, const xmlChar *SystemID)
393{
394    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
395    if (ctx == NULL) return;
396#ifdef DEBUG_SAX
397    xmlGenericError(xmlGenericErrorContext,
398	    "SAX.xmlSAX2ExternalSubset(%s, %s, %s)\n",
399            name, ExternalID, SystemID);
400#endif
401    if (((ExternalID != NULL) || (SystemID != NULL)) &&
402        (((ctxt->validate) || (ctxt->loadsubset != 0)) &&
403	 (ctxt->wellFormed && ctxt->myDoc))) {
404	/*
405	 * Try to fetch and parse the external subset.
406	 */
407	xmlParserInputPtr oldinput;
408	int oldinputNr;
409	int oldinputMax;
410	xmlParserInputPtr *oldinputTab;
411	xmlParserInputPtr input = NULL;
412	xmlCharEncoding enc;
413	int oldcharset;
414	const xmlChar *oldencoding;
415
416	/*
417	 * Ask the Entity resolver to load the damn thing
418	 */
419	if ((ctxt->sax != NULL) && (ctxt->sax->resolveEntity != NULL))
420	    input = ctxt->sax->resolveEntity(ctxt->userData, ExternalID,
421	                                        SystemID);
422	if (input == NULL) {
423	    return;
424	}
425
426	xmlNewDtd(ctxt->myDoc, name, ExternalID, SystemID);
427
428	/*
429	 * make sure we won't destroy the main document context
430	 */
431	oldinput = ctxt->input;
432	oldinputNr = ctxt->inputNr;
433	oldinputMax = ctxt->inputMax;
434	oldinputTab = ctxt->inputTab;
435	oldcharset = ctxt->charset;
436	oldencoding = ctxt->encoding;
437	ctxt->encoding = NULL;
438
439	ctxt->inputTab = (xmlParserInputPtr *)
440	                 xmlMalloc(5 * sizeof(xmlParserInputPtr));
441	if (ctxt->inputTab == NULL) {
442	    xmlSAX2ErrMemory(ctxt, "xmlSAX2ExternalSubset");
443	    ctxt->input = oldinput;
444	    ctxt->inputNr = oldinputNr;
445	    ctxt->inputMax = oldinputMax;
446	    ctxt->inputTab = oldinputTab;
447	    ctxt->charset = oldcharset;
448	    ctxt->encoding = oldencoding;
449	    return;
450	}
451	ctxt->inputNr = 0;
452	ctxt->inputMax = 5;
453	ctxt->input = NULL;
454	xmlPushInput(ctxt, input);
455
456	/*
457	 * On the fly encoding conversion if needed
458	 */
459	if (ctxt->input->length >= 4) {
460	    enc = xmlDetectCharEncoding(ctxt->input->cur, 4);
461	    xmlSwitchEncoding(ctxt, enc);
462	}
463
464	if (input->filename == NULL)
465	    input->filename = (char *) xmlCanonicPath(SystemID);
466	input->line = 1;
467	input->col = 1;
468	input->base = ctxt->input->cur;
469	input->cur = ctxt->input->cur;
470	input->free = NULL;
471
472	/*
473	 * let's parse that entity knowing it's an external subset.
474	 */
475	xmlParseExternalSubset(ctxt, ExternalID, SystemID);
476
477        /*
478	 * Free up the external entities
479	 */
480
481	while (ctxt->inputNr > 1)
482	    xmlPopInput(ctxt);
483	xmlFreeInputStream(ctxt->input);
484        xmlFree(ctxt->inputTab);
485
486	/*
487	 * Restore the parsing context of the main entity
488	 */
489	ctxt->input = oldinput;
490	ctxt->inputNr = oldinputNr;
491	ctxt->inputMax = oldinputMax;
492	ctxt->inputTab = oldinputTab;
493	ctxt->charset = oldcharset;
494	if ((ctxt->encoding != NULL) &&
495	    ((ctxt->dict == NULL) ||
496	     (!xmlDictOwns(ctxt->dict, ctxt->encoding))))
497	    xmlFree((xmlChar *) ctxt->encoding);
498	ctxt->encoding = oldencoding;
499	/* ctxt->wellFormed = oldwellFormed; */
500    }
501}
502
503/**
504 * xmlSAX2ResolveEntity:
505 * @ctx: the user data (XML parser context)
506 * @publicId: The public ID of the entity
507 * @systemId: The system ID of the entity
508 *
509 * The entity loader, to control the loading of external entities,
510 * the application can either:
511 *    - override this xmlSAX2ResolveEntity() callback in the SAX block
512 *    - or better use the xmlSetExternalEntityLoader() function to
513 *      set up it's own entity resolution routine
514 *
515 * Returns the xmlParserInputPtr if inlined or NULL for DOM behaviour.
516 */
517xmlParserInputPtr
518xmlSAX2ResolveEntity(void *ctx, const xmlChar *publicId, const xmlChar *systemId)
519{
520    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
521    xmlParserInputPtr ret;
522    xmlChar *URI;
523    const char *base = NULL;
524
525    if (ctx == NULL) return(NULL);
526    if (ctxt->input != NULL)
527	base = ctxt->input->filename;
528    if (base == NULL)
529	base = ctxt->directory;
530
531    URI = xmlBuildURI(systemId, (const xmlChar *) base);
532
533#ifdef DEBUG_SAX
534    xmlGenericError(xmlGenericErrorContext,
535	    "SAX.xmlSAX2ResolveEntity(%s, %s)\n", publicId, systemId);
536#endif
537
538    ret = xmlLoadExternalEntity((const char *) URI,
539				(const char *) publicId, ctxt);
540    if (URI != NULL)
541	xmlFree(URI);
542    return(ret);
543}
544
545/**
546 * xmlSAX2GetEntity:
547 * @ctx: the user data (XML parser context)
548 * @name: The entity name
549 *
550 * Get an entity by name
551 *
552 * Returns the xmlEntityPtr if found.
553 */
554xmlEntityPtr
555xmlSAX2GetEntity(void *ctx, const xmlChar *name)
556{
557    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
558    xmlEntityPtr ret = NULL;
559
560    if (ctx == NULL) return(NULL);
561#ifdef DEBUG_SAX
562    xmlGenericError(xmlGenericErrorContext,
563	    "SAX.xmlSAX2GetEntity(%s)\n", name);
564#endif
565
566    if (ctxt->inSubset == 0) {
567	ret = xmlGetPredefinedEntity(name);
568	if (ret != NULL)
569	    return(ret);
570    }
571    if ((ctxt->myDoc != NULL) && (ctxt->myDoc->standalone == 1)) {
572	if (ctxt->inSubset == 2) {
573	    ctxt->myDoc->standalone = 0;
574	    ret = xmlGetDocEntity(ctxt->myDoc, name);
575	    ctxt->myDoc->standalone = 1;
576	} else {
577	    ret = xmlGetDocEntity(ctxt->myDoc, name);
578	    if (ret == NULL) {
579		ctxt->myDoc->standalone = 0;
580		ret = xmlGetDocEntity(ctxt->myDoc, name);
581		if (ret != NULL) {
582		    xmlFatalErrMsg(ctxt, XML_ERR_NOT_STANDALONE,
583	 "Entity(%s) document marked standalone but requires external subset\n",
584				   name, NULL);
585		}
586		ctxt->myDoc->standalone = 1;
587	    }
588	}
589    } else {
590	ret = xmlGetDocEntity(ctxt->myDoc, name);
591    }
592    if ((ret != NULL) &&
593	((ctxt->validate) || (ctxt->replaceEntities)) &&
594	(ret->children == NULL) &&
595	(ret->etype == XML_EXTERNAL_GENERAL_PARSED_ENTITY)) {
596	int val;
597
598	/*
599	 * for validation purposes we really need to fetch and
600	 * parse the external entity
601	 */
602	xmlNodePtr children;
603	unsigned long oldnbent = ctxt->nbentities;
604
605        val = xmlParseCtxtExternalEntity(ctxt, ret->URI,
606		                         ret->ExternalID, &children);
607	if (val == 0) {
608	    xmlAddChildList((xmlNodePtr) ret, children);
609	} else {
610	    xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_PROCESSING,
611		           "Failure to process entity %s\n", name, NULL);
612	    ctxt->validate = 0;
613	    return(NULL);
614	}
615	ret->owner = 1;
616	if (ret->checked == 0) {
617	    ret->checked = (ctxt->nbentities - oldnbent + 1) * 2;
618	    if ((ret->content != NULL) && (xmlStrchr(ret->content, '<')))
619	        ret->checked |= 1;
620	}
621    }
622    return(ret);
623}
624
625/**
626 * xmlSAX2GetParameterEntity:
627 * @ctx: the user data (XML parser context)
628 * @name: The entity name
629 *
630 * Get a parameter entity by name
631 *
632 * Returns the xmlEntityPtr if found.
633 */
634xmlEntityPtr
635xmlSAX2GetParameterEntity(void *ctx, const xmlChar *name)
636{
637    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
638    xmlEntityPtr ret;
639
640    if (ctx == NULL) return(NULL);
641#ifdef DEBUG_SAX
642    xmlGenericError(xmlGenericErrorContext,
643	    "SAX.xmlSAX2GetParameterEntity(%s)\n", name);
644#endif
645
646    ret = xmlGetParameterEntity(ctxt->myDoc, name);
647    return(ret);
648}
649
650
651/**
652 * xmlSAX2EntityDecl:
653 * @ctx: the user data (XML parser context)
654 * @name:  the entity name
655 * @type:  the entity type
656 * @publicId: The public ID of the entity
657 * @systemId: The system ID of the entity
658 * @content: the entity value (without processing).
659 *
660 * An entity definition has been parsed
661 */
662void
663xmlSAX2EntityDecl(void *ctx, const xmlChar *name, int type,
664          const xmlChar *publicId, const xmlChar *systemId, xmlChar *content)
665{
666    xmlEntityPtr ent;
667    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
668
669    if (ctx == NULL) return;
670#ifdef DEBUG_SAX
671    xmlGenericError(xmlGenericErrorContext,
672	    "SAX.xmlSAX2EntityDecl(%s, %d, %s, %s, %s)\n",
673            name, type, publicId, systemId, content);
674#endif
675    if (ctxt->inSubset == 1) {
676	ent = xmlAddDocEntity(ctxt->myDoc, name, type, publicId,
677		              systemId, content);
678	if ((ent == NULL) && (ctxt->pedantic))
679	    xmlWarnMsg(ctxt, XML_WAR_ENTITY_REDEFINED,
680	     "Entity(%s) already defined in the internal subset\n",
681	               name);
682	if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
683	    xmlChar *URI;
684	    const char *base = NULL;
685
686	    if (ctxt->input != NULL)
687		base = ctxt->input->filename;
688	    if (base == NULL)
689		base = ctxt->directory;
690
691	    URI = xmlBuildURI(systemId, (const xmlChar *) base);
692	    ent->URI = URI;
693	}
694    } else if (ctxt->inSubset == 2) {
695	ent = xmlAddDtdEntity(ctxt->myDoc, name, type, publicId,
696		              systemId, content);
697	if ((ent == NULL) && (ctxt->pedantic) &&
698	    (ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
699	    ctxt->sax->warning(ctxt->userData,
700	     "Entity(%s) already defined in the external subset\n", name);
701	if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
702	    xmlChar *URI;
703	    const char *base = NULL;
704
705	    if (ctxt->input != NULL)
706		base = ctxt->input->filename;
707	    if (base == NULL)
708		base = ctxt->directory;
709
710	    URI = xmlBuildURI(systemId, (const xmlChar *) base);
711	    ent->URI = URI;
712	}
713    } else {
714	xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_PROCESSING,
715	               "SAX.xmlSAX2EntityDecl(%s) called while not in subset\n",
716		       name, NULL);
717    }
718}
719
720/**
721 * xmlSAX2AttributeDecl:
722 * @ctx: the user data (XML parser context)
723 * @elem:  the name of the element
724 * @fullname:  the attribute name
725 * @type:  the attribute type
726 * @def:  the type of default value
727 * @defaultValue: the attribute default value
728 * @tree:  the tree of enumerated value set
729 *
730 * An attribute definition has been parsed
731 */
732void
733xmlSAX2AttributeDecl(void *ctx, const xmlChar *elem, const xmlChar *fullname,
734              int type, int def, const xmlChar *defaultValue,
735	      xmlEnumerationPtr tree)
736{
737    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
738    xmlAttributePtr attr;
739    xmlChar *name = NULL, *prefix = NULL;
740
741    if ((ctxt == NULL) || (ctxt->myDoc == NULL))
742        return;
743
744#ifdef DEBUG_SAX
745    xmlGenericError(xmlGenericErrorContext,
746	    "SAX.xmlSAX2AttributeDecl(%s, %s, %d, %d, %s, ...)\n",
747            elem, fullname, type, def, defaultValue);
748#endif
749    if ((xmlStrEqual(fullname, BAD_CAST "xml:id")) &&
750        (type != XML_ATTRIBUTE_ID)) {
751	/*
752	 * Raise the error but keep the validity flag
753	 */
754	int tmp = ctxt->valid;
755	xmlErrValid(ctxt, XML_DTD_XMLID_TYPE,
756	      "xml:id : attribute type should be ID\n", NULL, NULL);
757	ctxt->valid = tmp;
758    }
759    /* TODO: optimize name/prefix allocation */
760    name = xmlSplitQName(ctxt, fullname, &prefix);
761    ctxt->vctxt.valid = 1;
762    if (ctxt->inSubset == 1)
763	attr = xmlAddAttributeDecl(&ctxt->vctxt, ctxt->myDoc->intSubset, elem,
764	       name, prefix, (xmlAttributeType) type,
765	       (xmlAttributeDefault) def, defaultValue, tree);
766    else if (ctxt->inSubset == 2)
767	attr = xmlAddAttributeDecl(&ctxt->vctxt, ctxt->myDoc->extSubset, elem,
768	   name, prefix, (xmlAttributeType) type,
769	   (xmlAttributeDefault) def, defaultValue, tree);
770    else {
771        xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
772	     "SAX.xmlSAX2AttributeDecl(%s) called while not in subset\n",
773	               name, NULL);
774	xmlFreeEnumeration(tree);
775	return;
776    }
777#ifdef LIBXML_VALID_ENABLED
778    if (ctxt->vctxt.valid == 0)
779	ctxt->valid = 0;
780    if ((attr != NULL) && (ctxt->validate) && (ctxt->wellFormed) &&
781        (ctxt->myDoc->intSubset != NULL))
782	ctxt->valid &= xmlValidateAttributeDecl(&ctxt->vctxt, ctxt->myDoc,
783	                                        attr);
784#endif /* LIBXML_VALID_ENABLED */
785    if (prefix != NULL)
786	xmlFree(prefix);
787    if (name != NULL)
788	xmlFree(name);
789}
790
791/**
792 * xmlSAX2ElementDecl:
793 * @ctx: the user data (XML parser context)
794 * @name:  the element name
795 * @type:  the element type
796 * @content: the element value tree
797 *
798 * An element definition has been parsed
799 */
800void
801xmlSAX2ElementDecl(void *ctx, const xmlChar * name, int type,
802            xmlElementContentPtr content)
803{
804    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
805    xmlElementPtr elem = NULL;
806
807    if ((ctxt == NULL) || (ctxt->myDoc == NULL))
808        return;
809
810#ifdef DEBUG_SAX
811    xmlGenericError(xmlGenericErrorContext,
812                    "SAX.xmlSAX2ElementDecl(%s, %d, ...)\n", name, type);
813#endif
814
815    if (ctxt->inSubset == 1)
816        elem = xmlAddElementDecl(&ctxt->vctxt, ctxt->myDoc->intSubset,
817                                 name, (xmlElementTypeVal) type, content);
818    else if (ctxt->inSubset == 2)
819        elem = xmlAddElementDecl(&ctxt->vctxt, ctxt->myDoc->extSubset,
820                                 name, (xmlElementTypeVal) type, content);
821    else {
822        xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
823	     "SAX.xmlSAX2ElementDecl(%s) called while not in subset\n",
824	               name, NULL);
825        return;
826    }
827#ifdef LIBXML_VALID_ENABLED
828    if (elem == NULL)
829        ctxt->valid = 0;
830    if (ctxt->validate && ctxt->wellFormed &&
831        ctxt->myDoc && ctxt->myDoc->intSubset)
832        ctxt->valid &=
833            xmlValidateElementDecl(&ctxt->vctxt, ctxt->myDoc, elem);
834#endif /* LIBXML_VALID_ENABLED */
835}
836
837/**
838 * xmlSAX2NotationDecl:
839 * @ctx: the user data (XML parser context)
840 * @name: The name of the notation
841 * @publicId: The public ID of the entity
842 * @systemId: The system ID of the entity
843 *
844 * What to do when a notation declaration has been parsed.
845 */
846void
847xmlSAX2NotationDecl(void *ctx, const xmlChar *name,
848	     const xmlChar *publicId, const xmlChar *systemId)
849{
850    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
851    xmlNotationPtr nota = NULL;
852
853    if ((ctxt == NULL) || (ctxt->myDoc == NULL))
854        return;
855
856#ifdef DEBUG_SAX
857    xmlGenericError(xmlGenericErrorContext,
858	    "SAX.xmlSAX2NotationDecl(%s, %s, %s)\n", name, publicId, systemId);
859#endif
860
861    if ((publicId == NULL) && (systemId == NULL)) {
862	xmlFatalErrMsg(ctxt, XML_ERR_NOTATION_PROCESSING,
863	     "SAX.xmlSAX2NotationDecl(%s) externalID or PublicID missing\n",
864	               name, NULL);
865	return;
866    } else if (ctxt->inSubset == 1)
867	nota = xmlAddNotationDecl(&ctxt->vctxt, ctxt->myDoc->intSubset, name,
868                              publicId, systemId);
869    else if (ctxt->inSubset == 2)
870	nota = xmlAddNotationDecl(&ctxt->vctxt, ctxt->myDoc->extSubset, name,
871                              publicId, systemId);
872    else {
873	xmlFatalErrMsg(ctxt, XML_ERR_NOTATION_PROCESSING,
874	     "SAX.xmlSAX2NotationDecl(%s) called while not in subset\n",
875	               name, NULL);
876	return;
877    }
878#ifdef LIBXML_VALID_ENABLED
879    if (nota == NULL) ctxt->valid = 0;
880    if ((ctxt->validate) && (ctxt->wellFormed) &&
881        (ctxt->myDoc->intSubset != NULL))
882	ctxt->valid &= xmlValidateNotationDecl(&ctxt->vctxt, ctxt->myDoc,
883	                                       nota);
884#endif /* LIBXML_VALID_ENABLED */
885}
886
887/**
888 * xmlSAX2UnparsedEntityDecl:
889 * @ctx: the user data (XML parser context)
890 * @name: The name of the entity
891 * @publicId: The public ID of the entity
892 * @systemId: The system ID of the entity
893 * @notationName: the name of the notation
894 *
895 * What to do when an unparsed entity declaration is parsed
896 */
897void
898xmlSAX2UnparsedEntityDecl(void *ctx, const xmlChar *name,
899		   const xmlChar *publicId, const xmlChar *systemId,
900		   const xmlChar *notationName)
901{
902    xmlEntityPtr ent;
903    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
904    if (ctx == NULL) return;
905#ifdef DEBUG_SAX
906    xmlGenericError(xmlGenericErrorContext,
907	    "SAX.xmlSAX2UnparsedEntityDecl(%s, %s, %s, %s)\n",
908            name, publicId, systemId, notationName);
909#endif
910    if (ctxt->inSubset == 1) {
911	ent = xmlAddDocEntity(ctxt->myDoc, name,
912			XML_EXTERNAL_GENERAL_UNPARSED_ENTITY,
913			publicId, systemId, notationName);
914	if ((ent == NULL) && (ctxt->pedantic) &&
915	    (ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
916	    ctxt->sax->warning(ctxt->userData,
917	     "Entity(%s) already defined in the internal subset\n", name);
918	if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
919	    xmlChar *URI;
920	    const char *base = NULL;
921
922	    if (ctxt->input != NULL)
923		base = ctxt->input->filename;
924	    if (base == NULL)
925		base = ctxt->directory;
926
927	    URI = xmlBuildURI(systemId, (const xmlChar *) base);
928	    ent->URI = URI;
929	}
930    } else if (ctxt->inSubset == 2) {
931	ent = xmlAddDtdEntity(ctxt->myDoc, name,
932			XML_EXTERNAL_GENERAL_UNPARSED_ENTITY,
933			publicId, systemId, notationName);
934	if ((ent == NULL) && (ctxt->pedantic) &&
935	    (ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
936	    ctxt->sax->warning(ctxt->userData,
937	     "Entity(%s) already defined in the external subset\n", name);
938	if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
939	    xmlChar *URI;
940	    const char *base = NULL;
941
942	    if (ctxt->input != NULL)
943		base = ctxt->input->filename;
944	    if (base == NULL)
945		base = ctxt->directory;
946
947	    URI = xmlBuildURI(systemId, (const xmlChar *) base);
948	    ent->URI = URI;
949	}
950    } else {
951        xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
952	     "SAX.xmlSAX2UnparsedEntityDecl(%s) called while not in subset\n",
953	               name, NULL);
954    }
955}
956
957/**
958 * xmlSAX2SetDocumentLocator:
959 * @ctx: the user data (XML parser context)
960 * @loc: A SAX Locator
961 *
962 * Receive the document locator at startup, actually xmlDefaultSAXLocator
963 * Everything is available on the context, so this is useless in our case.
964 */
965void
966xmlSAX2SetDocumentLocator(void *ctx ATTRIBUTE_UNUSED, xmlSAXLocatorPtr loc ATTRIBUTE_UNUSED)
967{
968    /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
969#ifdef DEBUG_SAX
970    xmlGenericError(xmlGenericErrorContext,
971	    "SAX.xmlSAX2SetDocumentLocator()\n");
972#endif
973}
974
975/**
976 * xmlSAX2StartDocument:
977 * @ctx: the user data (XML parser context)
978 *
979 * called when the document start being processed.
980 */
981void
982xmlSAX2StartDocument(void *ctx)
983{
984    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
985    xmlDocPtr doc;
986
987    if (ctx == NULL) return;
988
989#ifdef DEBUG_SAX
990    xmlGenericError(xmlGenericErrorContext,
991	    "SAX.xmlSAX2StartDocument()\n");
992#endif
993    if (ctxt->html) {
994#ifdef LIBXML_HTML_ENABLED
995	if (ctxt->myDoc == NULL)
996	    ctxt->myDoc = htmlNewDocNoDtD(NULL, NULL);
997	ctxt->myDoc->properties = XML_DOC_HTML;
998	ctxt->myDoc->parseFlags = ctxt->options;
999	if (ctxt->myDoc == NULL) {
1000	    xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument");
1001	    return;
1002	}
1003#else
1004        xmlGenericError(xmlGenericErrorContext,
1005		"libxml2 built without HTML support\n");
1006	ctxt->errNo = XML_ERR_INTERNAL_ERROR;
1007	ctxt->instate = XML_PARSER_EOF;
1008	ctxt->disableSAX = 1;
1009	return;
1010#endif
1011    } else {
1012	doc = ctxt->myDoc = xmlNewDoc(ctxt->version);
1013	if (doc != NULL) {
1014	    doc->properties = 0;
1015	    if (ctxt->options & XML_PARSE_OLD10)
1016	        doc->properties |= XML_DOC_OLD10;
1017	    doc->parseFlags = ctxt->options;
1018	    if (ctxt->encoding != NULL)
1019		doc->encoding = xmlStrdup(ctxt->encoding);
1020	    else
1021		doc->encoding = NULL;
1022	    doc->standalone = ctxt->standalone;
1023	} else {
1024	    xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument");
1025	    return;
1026	}
1027	if ((ctxt->dictNames) && (doc != NULL)) {
1028	    doc->dict = ctxt->dict;
1029	    xmlDictReference(doc->dict);
1030	}
1031    }
1032    if ((ctxt->myDoc != NULL) && (ctxt->myDoc->URL == NULL) &&
1033	(ctxt->input != NULL) && (ctxt->input->filename != NULL)) {
1034	ctxt->myDoc->URL = xmlPathToURI((const xmlChar *)ctxt->input->filename);
1035	if (ctxt->myDoc->URL == NULL)
1036	    xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument");
1037    }
1038}
1039
1040/**
1041 * xmlSAX2EndDocument:
1042 * @ctx: the user data (XML parser context)
1043 *
1044 * called when the document end has been detected.
1045 */
1046void
1047xmlSAX2EndDocument(void *ctx)
1048{
1049    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1050#ifdef DEBUG_SAX
1051    xmlGenericError(xmlGenericErrorContext,
1052	    "SAX.xmlSAX2EndDocument()\n");
1053#endif
1054    if (ctx == NULL) return;
1055#ifdef LIBXML_VALID_ENABLED
1056    if (ctxt->validate && ctxt->wellFormed &&
1057        ctxt->myDoc && ctxt->myDoc->intSubset)
1058	ctxt->valid &= xmlValidateDocumentFinal(&ctxt->vctxt, ctxt->myDoc);
1059#endif /* LIBXML_VALID_ENABLED */
1060
1061    /*
1062     * Grab the encoding if it was added on-the-fly
1063     */
1064    if ((ctxt->encoding != NULL) && (ctxt->myDoc != NULL) &&
1065	(ctxt->myDoc->encoding == NULL)) {
1066	ctxt->myDoc->encoding = ctxt->encoding;
1067	ctxt->encoding = NULL;
1068    }
1069    if ((ctxt->inputTab != NULL) &&
1070        (ctxt->inputNr > 0) && (ctxt->inputTab[0] != NULL) &&
1071        (ctxt->inputTab[0]->encoding != NULL) && (ctxt->myDoc != NULL) &&
1072	(ctxt->myDoc->encoding == NULL)) {
1073	ctxt->myDoc->encoding = xmlStrdup(ctxt->inputTab[0]->encoding);
1074    }
1075    if ((ctxt->charset != XML_CHAR_ENCODING_NONE) && (ctxt->myDoc != NULL) &&
1076	(ctxt->myDoc->charset == XML_CHAR_ENCODING_NONE)) {
1077	ctxt->myDoc->charset = ctxt->charset;
1078    }
1079}
1080
1081#if defined(LIBXML_SAX1_ENABLED) || defined(LIBXML_HTML_ENABLED) || defined(LIBXML_WRITER_ENABLED) || defined(LIBXML_DOCB_ENABLED)
1082/**
1083 * xmlSAX2AttributeInternal:
1084 * @ctx: the user data (XML parser context)
1085 * @fullname:  The attribute name, including namespace prefix
1086 * @value:  The attribute value
1087 * @prefix: the prefix on the element node
1088 *
1089 * Handle an attribute that has been read by the parser.
1090 * The default handling is to convert the attribute into an
1091 * DOM subtree and past it in a new xmlAttr element added to
1092 * the element.
1093 */
1094static void
1095xmlSAX2AttributeInternal(void *ctx, const xmlChar *fullname,
1096             const xmlChar *value, const xmlChar *prefix ATTRIBUTE_UNUSED)
1097{
1098    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1099    xmlAttrPtr ret;
1100    xmlChar *name;
1101    xmlChar *ns;
1102    xmlChar *nval;
1103    xmlNsPtr namespace;
1104
1105    if (ctxt->html) {
1106	name = xmlStrdup(fullname);
1107	ns = NULL;
1108	namespace = NULL;
1109    } else {
1110	/*
1111	 * Split the full name into a namespace prefix and the tag name
1112	 */
1113	name = xmlSplitQName(ctxt, fullname, &ns);
1114	if ((name != NULL) && (name[0] == 0)) {
1115	    if (xmlStrEqual(ns, BAD_CAST "xmlns")) {
1116		xmlNsErrMsg(ctxt, XML_ERR_NS_DECL_ERROR,
1117			    "invalid namespace declaration '%s'\n",
1118			    fullname, NULL);
1119	    } else {
1120		xmlNsWarnMsg(ctxt, XML_WAR_NS_COLUMN,
1121			     "Avoid attribute ending with ':' like '%s'\n",
1122			     fullname, NULL);
1123	    }
1124	    if (ns != NULL)
1125		xmlFree(ns);
1126	    ns = NULL;
1127	    xmlFree(name);
1128	    name = xmlStrdup(fullname);
1129	}
1130    }
1131    if (name == NULL) {
1132        xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1133	if (ns != NULL)
1134	    xmlFree(ns);
1135	return;
1136    }
1137
1138#ifdef LIBXML_HTML_ENABLED
1139    if ((ctxt->html) &&
1140        (value == NULL) && (htmlIsBooleanAttr(fullname))) {
1141            nval = xmlStrdup(fullname);
1142            value = (const xmlChar *) nval;
1143    } else
1144#endif
1145    {
1146#ifdef LIBXML_VALID_ENABLED
1147        /*
1148         * Do the last stage of the attribute normalization
1149         * Needed for HTML too:
1150         *   http://www.w3.org/TR/html4/types.html#h-6.2
1151         */
1152        ctxt->vctxt.valid = 1;
1153        nval = xmlValidCtxtNormalizeAttributeValue(&ctxt->vctxt,
1154                                               ctxt->myDoc, ctxt->node,
1155                                               fullname, value);
1156        if (ctxt->vctxt.valid != 1) {
1157            ctxt->valid = 0;
1158        }
1159        if (nval != NULL)
1160            value = nval;
1161#else
1162        nval = NULL;
1163#endif /* LIBXML_VALID_ENABLED */
1164    }
1165
1166    /*
1167     * Check whether it's a namespace definition
1168     */
1169    if ((!ctxt->html) && (ns == NULL) &&
1170        (name[0] == 'x') && (name[1] == 'm') && (name[2] == 'l') &&
1171        (name[3] == 'n') && (name[4] == 's') && (name[5] == 0)) {
1172	xmlNsPtr nsret;
1173	xmlChar *val;
1174
1175        if (!ctxt->replaceEntities) {
1176	    ctxt->depth++;
1177	    val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF,
1178		                          0,0,0);
1179	    ctxt->depth--;
1180	} else {
1181	    val = (xmlChar *) value;
1182	}
1183
1184	if (val[0] != 0) {
1185	    xmlURIPtr uri;
1186
1187	    uri = xmlParseURI((const char *)val);
1188	    if (uri == NULL) {
1189		if ((ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
1190		    ctxt->sax->warning(ctxt->userData,
1191			 "xmlns: %s not a valid URI\n", val);
1192	    } else {
1193		if (uri->scheme == NULL) {
1194		    if ((ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
1195			ctxt->sax->warning(ctxt->userData,
1196			     "xmlns: URI %s is not absolute\n", val);
1197		}
1198		xmlFreeURI(uri);
1199	    }
1200	}
1201
1202	/* a default namespace definition */
1203	nsret = xmlNewNs(ctxt->node, val, NULL);
1204
1205#ifdef LIBXML_VALID_ENABLED
1206	/*
1207	 * Validate also for namespace decls, they are attributes from
1208	 * an XML-1.0 perspective
1209	 */
1210        if (nsret != NULL && ctxt->validate && ctxt->wellFormed &&
1211	    ctxt->myDoc && ctxt->myDoc->intSubset)
1212	    ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc,
1213					   ctxt->node, prefix, nsret, val);
1214#endif /* LIBXML_VALID_ENABLED */
1215	if (name != NULL)
1216	    xmlFree(name);
1217	if (nval != NULL)
1218	    xmlFree(nval);
1219	if (val != value)
1220	    xmlFree(val);
1221	return;
1222    }
1223    if ((!ctxt->html) &&
1224	(ns != NULL) && (ns[0] == 'x') && (ns[1] == 'm') && (ns[2] == 'l') &&
1225        (ns[3] == 'n') && (ns[4] == 's') && (ns[5] == 0)) {
1226	xmlNsPtr nsret;
1227	xmlChar *val;
1228
1229        if (!ctxt->replaceEntities) {
1230	    ctxt->depth++;
1231	    val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF,
1232		                          0,0,0);
1233	    ctxt->depth--;
1234	    if (val == NULL) {
1235	        xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1236	        xmlFree(ns);
1237		if (name != NULL)
1238		    xmlFree(name);
1239		return;
1240	    }
1241	} else {
1242	    val = (xmlChar *) value;
1243	}
1244
1245	if (val[0] == 0) {
1246	    xmlNsErrMsg(ctxt, XML_NS_ERR_EMPTY,
1247		        "Empty namespace name for prefix %s\n", name, NULL);
1248	}
1249	if ((ctxt->pedantic != 0) && (val[0] != 0)) {
1250	    xmlURIPtr uri;
1251
1252	    uri = xmlParseURI((const char *)val);
1253	    if (uri == NULL) {
1254	        xmlNsWarnMsg(ctxt, XML_WAR_NS_URI,
1255			 "xmlns:%s: %s not a valid URI\n", name, value);
1256	    } else {
1257		if (uri->scheme == NULL) {
1258		    xmlNsWarnMsg(ctxt, XML_WAR_NS_URI_RELATIVE,
1259			   "xmlns:%s: URI %s is not absolute\n", name, value);
1260		}
1261		xmlFreeURI(uri);
1262	    }
1263	}
1264
1265	/* a standard namespace definition */
1266	nsret = xmlNewNs(ctxt->node, val, name);
1267	xmlFree(ns);
1268#ifdef LIBXML_VALID_ENABLED
1269	/*
1270	 * Validate also for namespace decls, they are attributes from
1271	 * an XML-1.0 perspective
1272	 */
1273        if (nsret != NULL && ctxt->validate && ctxt->wellFormed &&
1274	    ctxt->myDoc && ctxt->myDoc->intSubset)
1275	    ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc,
1276					   ctxt->node, prefix, nsret, value);
1277#endif /* LIBXML_VALID_ENABLED */
1278	if (name != NULL)
1279	    xmlFree(name);
1280	if (nval != NULL)
1281	    xmlFree(nval);
1282	if (val != value)
1283	    xmlFree(val);
1284	return;
1285    }
1286
1287    if (ns != NULL) {
1288	namespace = xmlSearchNs(ctxt->myDoc, ctxt->node, ns);
1289
1290	if (namespace == NULL) {
1291	    xmlNsErrMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
1292		    "Namespace prefix %s of attribute %s is not defined\n",
1293		             ns, name);
1294	} else {
1295            xmlAttrPtr prop;
1296
1297            prop = ctxt->node->properties;
1298            while (prop != NULL) {
1299                if (prop->ns != NULL) {
1300                    if ((xmlStrEqual(name, prop->name)) &&
1301                        ((namespace == prop->ns) ||
1302                         (xmlStrEqual(namespace->href, prop->ns->href)))) {
1303                            xmlNsErrMsg(ctxt, XML_ERR_ATTRIBUTE_REDEFINED,
1304                                    "Attribute %s in %s redefined\n",
1305                                             name, namespace->href);
1306                        ctxt->wellFormed = 0;
1307                        if (ctxt->recovery == 0) ctxt->disableSAX = 1;
1308                        goto error;
1309                    }
1310                }
1311                prop = prop->next;
1312            }
1313        }
1314    } else {
1315	namespace = NULL;
1316    }
1317
1318    /* !!!!!! <a toto:arg="" xmlns:toto="http://toto.com"> */
1319    ret = xmlNewNsPropEatName(ctxt->node, namespace, name, NULL);
1320
1321    if (ret != NULL) {
1322        if ((ctxt->replaceEntities == 0) && (!ctxt->html)) {
1323	    xmlNodePtr tmp;
1324
1325	    ret->children = xmlStringGetNodeList(ctxt->myDoc, value);
1326	    tmp = ret->children;
1327	    while (tmp != NULL) {
1328		tmp->parent = (xmlNodePtr) ret;
1329		if (tmp->next == NULL)
1330		    ret->last = tmp;
1331		tmp = tmp->next;
1332	    }
1333	} else if (value != NULL) {
1334	    ret->children = xmlNewDocText(ctxt->myDoc, value);
1335	    ret->last = ret->children;
1336	    if (ret->children != NULL)
1337		ret->children->parent = (xmlNodePtr) ret;
1338	}
1339    }
1340
1341#ifdef LIBXML_VALID_ENABLED
1342    if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed &&
1343        ctxt->myDoc && ctxt->myDoc->intSubset) {
1344
1345	/*
1346	 * If we don't substitute entities, the validation should be
1347	 * done on a value with replaced entities anyway.
1348	 */
1349        if (!ctxt->replaceEntities) {
1350	    xmlChar *val;
1351
1352	    ctxt->depth++;
1353	    val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF,
1354		                          0,0,0);
1355	    ctxt->depth--;
1356
1357	    if (val == NULL)
1358		ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
1359				ctxt->myDoc, ctxt->node, ret, value);
1360	    else {
1361		xmlChar *nvalnorm;
1362
1363		/*
1364		 * Do the last stage of the attribute normalization
1365		 * It need to be done twice ... it's an extra burden related
1366		 * to the ability to keep xmlSAX2References in attributes
1367		 */
1368		nvalnorm = xmlValidNormalizeAttributeValue(ctxt->myDoc,
1369					    ctxt->node, fullname, val);
1370		if (nvalnorm != NULL) {
1371		    xmlFree(val);
1372		    val = nvalnorm;
1373		}
1374
1375		ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
1376			        ctxt->myDoc, ctxt->node, ret, val);
1377                xmlFree(val);
1378	    }
1379	} else {
1380	    ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt, ctxt->myDoc,
1381					       ctxt->node, ret, value);
1382	}
1383    } else
1384#endif /* LIBXML_VALID_ENABLED */
1385           if (((ctxt->loadsubset & XML_SKIP_IDS) == 0) &&
1386	       (((ctxt->replaceEntities == 0) && (ctxt->external != 2)) ||
1387	        ((ctxt->replaceEntities != 0) && (ctxt->inSubset == 0)))) {
1388        /*
1389	 * when validating, the ID registration is done at the attribute
1390	 * validation level. Otherwise we have to do specific handling here.
1391	 */
1392	if (xmlStrEqual(fullname, BAD_CAST "xml:id")) {
1393	    /*
1394	     * Add the xml:id value
1395	     *
1396	     * Open issue: normalization of the value.
1397	     */
1398	    if (xmlValidateNCName(value, 1) != 0) {
1399	        xmlErrValid(ctxt, XML_DTD_XMLID_VALUE,
1400		      "xml:id : attribute value %s is not an NCName\n",
1401			    (const char *) value, NULL);
1402	    }
1403	    xmlAddID(&ctxt->vctxt, ctxt->myDoc, value, ret);
1404	} else if (xmlIsID(ctxt->myDoc, ctxt->node, ret))
1405	    xmlAddID(&ctxt->vctxt, ctxt->myDoc, value, ret);
1406	else if (xmlIsRef(ctxt->myDoc, ctxt->node, ret))
1407	    xmlAddRef(&ctxt->vctxt, ctxt->myDoc, value, ret);
1408    }
1409
1410error:
1411    if (nval != NULL)
1412	xmlFree(nval);
1413    if (ns != NULL)
1414	xmlFree(ns);
1415}
1416
1417/*
1418 * xmlCheckDefaultedAttributes:
1419 *
1420 * Check defaulted attributes from the DTD
1421 */
1422static void
1423xmlCheckDefaultedAttributes(xmlParserCtxtPtr ctxt, const xmlChar *name,
1424	const xmlChar *prefix, const xmlChar **atts) {
1425    xmlElementPtr elemDecl;
1426    const xmlChar *att;
1427    int internal = 1;
1428    int i;
1429
1430    elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->intSubset, name, prefix);
1431    if (elemDecl == NULL) {
1432	elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->extSubset, name, prefix);
1433	internal = 0;
1434    }
1435
1436process_external_subset:
1437
1438    if (elemDecl != NULL) {
1439	xmlAttributePtr attr = elemDecl->attributes;
1440	/*
1441	 * Check against defaulted attributes from the external subset
1442	 * if the document is stamped as standalone
1443	 */
1444	if ((ctxt->myDoc->standalone == 1) &&
1445	    (ctxt->myDoc->extSubset != NULL) &&
1446	    (ctxt->validate)) {
1447	    while (attr != NULL) {
1448		if ((attr->defaultValue != NULL) &&
1449		    (xmlGetDtdQAttrDesc(ctxt->myDoc->extSubset,
1450					attr->elem, attr->name,
1451					attr->prefix) == attr) &&
1452		    (xmlGetDtdQAttrDesc(ctxt->myDoc->intSubset,
1453					attr->elem, attr->name,
1454					attr->prefix) == NULL)) {
1455		    xmlChar *fulln;
1456
1457		    if (attr->prefix != NULL) {
1458			fulln = xmlStrdup(attr->prefix);
1459			fulln = xmlStrcat(fulln, BAD_CAST ":");
1460			fulln = xmlStrcat(fulln, attr->name);
1461		    } else {
1462			fulln = xmlStrdup(attr->name);
1463		    }
1464                    if (fulln == NULL) {
1465                        xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1466                        break;
1467                    }
1468
1469		    /*
1470		     * Check that the attribute is not declared in the
1471		     * serialization
1472		     */
1473		    att = NULL;
1474		    if (atts != NULL) {
1475			i = 0;
1476			att = atts[i];
1477			while (att != NULL) {
1478			    if (xmlStrEqual(att, fulln))
1479				break;
1480			    i += 2;
1481			    att = atts[i];
1482			}
1483		    }
1484		    if (att == NULL) {
1485		        xmlErrValid(ctxt, XML_DTD_STANDALONE_DEFAULTED,
1486      "standalone: attribute %s on %s defaulted from external subset\n",
1487				    (const char *)fulln,
1488				    (const char *)attr->elem);
1489		    }
1490                    xmlFree(fulln);
1491		}
1492		attr = attr->nexth;
1493	    }
1494	}
1495
1496	/*
1497	 * Actually insert defaulted values when needed
1498	 */
1499	attr = elemDecl->attributes;
1500	while (attr != NULL) {
1501	    /*
1502	     * Make sure that attributes redefinition occuring in the
1503	     * internal subset are not overriden by definitions in the
1504	     * external subset.
1505	     */
1506	    if (attr->defaultValue != NULL) {
1507		/*
1508		 * the element should be instantiated in the tree if:
1509		 *  - this is a namespace prefix
1510		 *  - the user required for completion in the tree
1511		 *    like XSLT
1512		 *  - there isn't already an attribute definition
1513		 *    in the internal subset overriding it.
1514		 */
1515		if (((attr->prefix != NULL) &&
1516		     (xmlStrEqual(attr->prefix, BAD_CAST "xmlns"))) ||
1517		    ((attr->prefix == NULL) &&
1518		     (xmlStrEqual(attr->name, BAD_CAST "xmlns"))) ||
1519		    (ctxt->loadsubset & XML_COMPLETE_ATTRS)) {
1520		    xmlAttributePtr tst;
1521
1522		    tst = xmlGetDtdQAttrDesc(ctxt->myDoc->intSubset,
1523					     attr->elem, attr->name,
1524					     attr->prefix);
1525		    if ((tst == attr) || (tst == NULL)) {
1526		        xmlChar fn[50];
1527			xmlChar *fulln;
1528
1529                        fulln = xmlBuildQName(attr->name, attr->prefix, fn, 50);
1530			if (fulln == NULL) {
1531			    xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1532			    return;
1533			}
1534
1535			/*
1536			 * Check that the attribute is not declared in the
1537			 * serialization
1538			 */
1539			att = NULL;
1540			if (atts != NULL) {
1541			    i = 0;
1542			    att = atts[i];
1543			    while (att != NULL) {
1544				if (xmlStrEqual(att, fulln))
1545				    break;
1546				i += 2;
1547				att = atts[i];
1548			    }
1549			}
1550			if (att == NULL) {
1551			    xmlSAX2AttributeInternal(ctxt, fulln,
1552						 attr->defaultValue, prefix);
1553			}
1554			if ((fulln != fn) && (fulln != attr->name))
1555			    xmlFree(fulln);
1556		    }
1557		}
1558	    }
1559	    attr = attr->nexth;
1560	}
1561	if (internal == 1) {
1562	    elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->extSubset,
1563		                             name, prefix);
1564	    internal = 0;
1565	    goto process_external_subset;
1566	}
1567    }
1568}
1569
1570/**
1571 * xmlSAX2StartElement:
1572 * @ctx: the user data (XML parser context)
1573 * @fullname:  The element name, including namespace prefix
1574 * @atts:  An array of name/value attributes pairs, NULL terminated
1575 *
1576 * called when an opening tag has been processed.
1577 */
1578void
1579xmlSAX2StartElement(void *ctx, const xmlChar *fullname, const xmlChar **atts)
1580{
1581    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1582    xmlNodePtr ret;
1583    xmlNodePtr parent;
1584    xmlNsPtr ns;
1585    xmlChar *name;
1586    xmlChar *prefix;
1587    const xmlChar *att;
1588    const xmlChar *value;
1589    int i;
1590
1591    if ((ctx == NULL) || (fullname == NULL) || (ctxt->myDoc == NULL)) return;
1592    parent = ctxt->node;
1593#ifdef DEBUG_SAX
1594    xmlGenericError(xmlGenericErrorContext,
1595	    "SAX.xmlSAX2StartElement(%s)\n", fullname);
1596#endif
1597
1598    /*
1599     * First check on validity:
1600     */
1601    if (ctxt->validate && (ctxt->myDoc->extSubset == NULL) &&
1602        ((ctxt->myDoc->intSubset == NULL) ||
1603	 ((ctxt->myDoc->intSubset->notations == NULL) &&
1604	  (ctxt->myDoc->intSubset->elements == NULL) &&
1605	  (ctxt->myDoc->intSubset->attributes == NULL) &&
1606	  (ctxt->myDoc->intSubset->entities == NULL)))) {
1607	xmlErrValid(ctxt, XML_ERR_NO_DTD,
1608	  "Validation failed: no DTD found !", NULL, NULL);
1609	ctxt->validate = 0;
1610    }
1611
1612
1613    /*
1614     * Split the full name into a namespace prefix and the tag name
1615     */
1616    name = xmlSplitQName(ctxt, fullname, &prefix);
1617
1618
1619    /*
1620     * Note : the namespace resolution is deferred until the end of the
1621     *        attributes parsing, since local namespace can be defined as
1622     *        an attribute at this level.
1623     */
1624    ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL, name, NULL);
1625    if (ret == NULL) {
1626        if (prefix != NULL)
1627	    xmlFree(prefix);
1628	xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1629        return;
1630    }
1631    if (ctxt->myDoc->children == NULL) {
1632#ifdef DEBUG_SAX_TREE
1633	xmlGenericError(xmlGenericErrorContext, "Setting %s as root\n", name);
1634#endif
1635        xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
1636    } else if (parent == NULL) {
1637        parent = ctxt->myDoc->children;
1638    }
1639    ctxt->nodemem = -1;
1640    if (ctxt->linenumbers) {
1641	if (ctxt->input != NULL) {
1642	    if (ctxt->input->line < 65535)
1643		ret->line = (short) ctxt->input->line;
1644	    else
1645	        ret->line = 65535;
1646	}
1647    }
1648
1649    /*
1650     * We are parsing a new node.
1651     */
1652#ifdef DEBUG_SAX_TREE
1653    xmlGenericError(xmlGenericErrorContext, "pushing(%s)\n", name);
1654#endif
1655    nodePush(ctxt, ret);
1656
1657    /*
1658     * Link the child element
1659     */
1660    if (parent != NULL) {
1661        if (parent->type == XML_ELEMENT_NODE) {
1662#ifdef DEBUG_SAX_TREE
1663	    xmlGenericError(xmlGenericErrorContext,
1664		    "adding child %s to %s\n", name, parent->name);
1665#endif
1666	    xmlAddChild(parent, ret);
1667	} else {
1668#ifdef DEBUG_SAX_TREE
1669	    xmlGenericError(xmlGenericErrorContext,
1670		    "adding sibling %s to ", name);
1671	    xmlDebugDumpOneNode(stderr, parent, 0);
1672#endif
1673	    xmlAddSibling(parent, ret);
1674	}
1675    }
1676
1677    /*
1678     * Insert all the defaulted attributes from the DTD especially namespaces
1679     */
1680    if ((!ctxt->html) &&
1681	((ctxt->myDoc->intSubset != NULL) ||
1682	 (ctxt->myDoc->extSubset != NULL))) {
1683	xmlCheckDefaultedAttributes(ctxt, name, prefix, atts);
1684    }
1685
1686    /*
1687     * process all the attributes whose name start with "xmlns"
1688     */
1689    if (atts != NULL) {
1690        i = 0;
1691	att = atts[i++];
1692	value = atts[i++];
1693	if (!ctxt->html) {
1694	    while ((att != NULL) && (value != NULL)) {
1695		if ((att[0] == 'x') && (att[1] == 'm') && (att[2] == 'l') &&
1696		    (att[3] == 'n') && (att[4] == 's'))
1697		    xmlSAX2AttributeInternal(ctxt, att, value, prefix);
1698
1699		att = atts[i++];
1700		value = atts[i++];
1701	    }
1702	}
1703    }
1704
1705    /*
1706     * Search the namespace, note that since the attributes have been
1707     * processed, the local namespaces are available.
1708     */
1709    ns = xmlSearchNs(ctxt->myDoc, ret, prefix);
1710    if ((ns == NULL) && (parent != NULL))
1711	ns = xmlSearchNs(ctxt->myDoc, parent, prefix);
1712    if ((prefix != NULL) && (ns == NULL)) {
1713	ns = xmlNewNs(ret, NULL, prefix);
1714	xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
1715		     "Namespace prefix %s is not defined\n",
1716		     prefix, NULL);
1717    }
1718
1719    /*
1720     * set the namespace node, making sure that if the default namspace
1721     * is unbound on a parent we simply kee it NULL
1722     */
1723    if ((ns != NULL) && (ns->href != NULL) &&
1724	((ns->href[0] != 0) || (ns->prefix != NULL)))
1725	xmlSetNs(ret, ns);
1726
1727    /*
1728     * process all the other attributes
1729     */
1730    if (atts != NULL) {
1731        i = 0;
1732	att = atts[i++];
1733	value = atts[i++];
1734	if (ctxt->html) {
1735	    while (att != NULL) {
1736		xmlSAX2AttributeInternal(ctxt, att, value, NULL);
1737		att = atts[i++];
1738		value = atts[i++];
1739	    }
1740	} else {
1741	    while ((att != NULL) && (value != NULL)) {
1742		if ((att[0] != 'x') || (att[1] != 'm') || (att[2] != 'l') ||
1743		    (att[3] != 'n') || (att[4] != 's'))
1744		    xmlSAX2AttributeInternal(ctxt, att, value, NULL);
1745
1746		/*
1747		 * Next ones
1748		 */
1749		att = atts[i++];
1750		value = atts[i++];
1751	    }
1752	}
1753    }
1754
1755#ifdef LIBXML_VALID_ENABLED
1756    /*
1757     * If it's the Document root, finish the DTD validation and
1758     * check the document root element for validity
1759     */
1760    if ((ctxt->validate) && (ctxt->vctxt.finishDtd == XML_CTXT_FINISH_DTD_0)) {
1761	int chk;
1762
1763	chk = xmlValidateDtdFinal(&ctxt->vctxt, ctxt->myDoc);
1764	if (chk <= 0)
1765	    ctxt->valid = 0;
1766	if (chk < 0)
1767	    ctxt->wellFormed = 0;
1768	ctxt->valid &= xmlValidateRoot(&ctxt->vctxt, ctxt->myDoc);
1769	ctxt->vctxt.finishDtd = XML_CTXT_FINISH_DTD_1;
1770    }
1771#endif /* LIBXML_VALID_ENABLED */
1772
1773    if (prefix != NULL)
1774	xmlFree(prefix);
1775
1776}
1777
1778/**
1779 * xmlSAX2EndElement:
1780 * @ctx: the user data (XML parser context)
1781 * @name:  The element name
1782 *
1783 * called when the end of an element has been detected.
1784 */
1785void
1786xmlSAX2EndElement(void *ctx, const xmlChar *name ATTRIBUTE_UNUSED)
1787{
1788    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1789    xmlNodePtr cur;
1790
1791    if (ctx == NULL) return;
1792    cur = ctxt->node;
1793#ifdef DEBUG_SAX
1794    if (name == NULL)
1795        xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2EndElement(NULL)\n");
1796    else
1797	xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2EndElement(%s)\n", name);
1798#endif
1799
1800    /* Capture end position and add node */
1801    if (cur != NULL && ctxt->record_info) {
1802      ctxt->nodeInfo->end_pos = ctxt->input->cur - ctxt->input->base;
1803      ctxt->nodeInfo->end_line = ctxt->input->line;
1804      ctxt->nodeInfo->node = cur;
1805      xmlParserAddNodeInfo(ctxt, ctxt->nodeInfo);
1806    }
1807    ctxt->nodemem = -1;
1808
1809#ifdef LIBXML_VALID_ENABLED
1810    if (ctxt->validate && ctxt->wellFormed &&
1811        ctxt->myDoc && ctxt->myDoc->intSubset)
1812        ctxt->valid &= xmlValidateOneElement(&ctxt->vctxt, ctxt->myDoc,
1813					     cur);
1814#endif /* LIBXML_VALID_ENABLED */
1815
1816
1817    /*
1818     * end of parsing of this node.
1819     */
1820#ifdef DEBUG_SAX_TREE
1821    xmlGenericError(xmlGenericErrorContext, "popping(%s)\n", cur->name);
1822#endif
1823    nodePop(ctxt);
1824}
1825#endif /* LIBXML_SAX1_ENABLED || LIBXML_HTML_ENABLE */
1826
1827/*
1828 * xmlSAX2TextNode:
1829 * @ctxt:  the parser context
1830 * @str:  the input string
1831 * @len: the string length
1832 *
1833 * Callback for a text node
1834 *
1835 * Returns the newly allocated string or NULL if not needed or error
1836 */
1837static xmlNodePtr
1838xmlSAX2TextNode(xmlParserCtxtPtr ctxt, const xmlChar *str, int len) {
1839    xmlNodePtr ret;
1840    const xmlChar *intern = NULL;
1841
1842    /*
1843     * Allocate
1844     */
1845    if (ctxt->freeElems != NULL) {
1846	ret = ctxt->freeElems;
1847	ctxt->freeElems = ret->next;
1848	ctxt->freeElemsNr--;
1849    } else {
1850	ret = (xmlNodePtr) xmlMalloc(sizeof(xmlNode));
1851    }
1852    if (ret == NULL) {
1853        xmlErrMemory(ctxt, "xmlSAX2Characters");
1854	return(NULL);
1855    }
1856    memset(ret, 0, sizeof(xmlNode));
1857    /*
1858     * intern the formatting blanks found between tags, or the
1859     * very short strings
1860     */
1861    if (ctxt->dictNames) {
1862        xmlChar cur = str[len];
1863
1864	if ((len < (int) (2 * sizeof(void *))) &&
1865	    (ctxt->options & XML_PARSE_COMPACT)) {
1866	    /* store the string in the node overriding properties and nsDef */
1867	    xmlChar *tmp = (xmlChar *) &(ret->properties);
1868	    memcpy(tmp, str, len);
1869	    tmp[len] = 0;
1870	    intern = tmp;
1871	} else if ((len <= 3) && ((cur == '"') || (cur == '\'') ||
1872	    ((cur == '<') && (str[len + 1] != '!')))) {
1873	    intern = xmlDictLookup(ctxt->dict, str, len);
1874	} else if (IS_BLANK_CH(*str) && (len < 60) && (cur == '<') &&
1875	           (str[len + 1] != '!')) {
1876	    int i;
1877
1878	    for (i = 1;i < len;i++) {
1879		if (!IS_BLANK_CH(str[i])) goto skip;
1880	    }
1881	    intern = xmlDictLookup(ctxt->dict, str, len);
1882	}
1883    }
1884skip:
1885    ret->type = XML_TEXT_NODE;
1886
1887    ret->name = xmlStringText;
1888    if (intern == NULL) {
1889	ret->content = xmlStrndup(str, len);
1890	if (ret->content == NULL) {
1891	    xmlSAX2ErrMemory(ctxt, "xmlSAX2TextNode");
1892	    xmlFree(ret);
1893	    return(NULL);
1894	}
1895    } else
1896	ret->content = (xmlChar *) intern;
1897
1898    if (ctxt->linenumbers) {
1899	if (ctxt->input != NULL) {
1900	    if (ctxt->input->line < 65535)
1901		ret->line = (short) ctxt->input->line;
1902	    else {
1903	        ret->line = 65535;
1904		if (ctxt->options & XML_PARSE_BIG_LINES)
1905		    ret->psvi = (void *) (long) ctxt->input->line;
1906	    }
1907	}
1908    }
1909
1910    if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue))
1911	xmlRegisterNodeDefaultValue(ret);
1912    return(ret);
1913}
1914
1915#ifdef LIBXML_VALID_ENABLED
1916/*
1917 * xmlSAX2DecodeAttrEntities:
1918 * @ctxt:  the parser context
1919 * @str:  the input string
1920 * @len: the string length
1921 *
1922 * Remove the entities from an attribute value
1923 *
1924 * Returns the newly allocated string or NULL if not needed or error
1925 */
1926static xmlChar *
1927xmlSAX2DecodeAttrEntities(xmlParserCtxtPtr ctxt, const xmlChar *str,
1928                          const xmlChar *end) {
1929    const xmlChar *in;
1930    xmlChar *ret;
1931
1932    in = str;
1933    while (in < end)
1934        if (*in++ == '&')
1935	    goto decode;
1936    return(NULL);
1937decode:
1938    ctxt->depth++;
1939    ret = xmlStringLenDecodeEntities(ctxt, str, end - str,
1940				     XML_SUBSTITUTE_REF, 0,0,0);
1941    ctxt->depth--;
1942    return(ret);
1943}
1944#endif /* LIBXML_VALID_ENABLED */
1945
1946/**
1947 * xmlSAX2AttributeNs:
1948 * @ctx: the user data (XML parser context)
1949 * @localname:  the local name of the attribute
1950 * @prefix:  the attribute namespace prefix if available
1951 * @URI:  the attribute namespace name if available
1952 * @value:  Start of the attribute value
1953 * @valueend: end of the attribute value
1954 *
1955 * Handle an attribute that has been read by the parser.
1956 * The default handling is to convert the attribute into an
1957 * DOM subtree and past it in a new xmlAttr element added to
1958 * the element.
1959 */
1960static void
1961xmlSAX2AttributeNs(xmlParserCtxtPtr ctxt,
1962                   const xmlChar * localname,
1963                   const xmlChar * prefix,
1964		   const xmlChar * value,
1965		   const xmlChar * valueend)
1966{
1967    xmlAttrPtr ret;
1968    xmlNsPtr namespace = NULL;
1969    xmlChar *dup = NULL;
1970
1971    /*
1972     * Note: if prefix == NULL, the attribute is not in the default namespace
1973     */
1974    if (prefix != NULL)
1975	namespace = xmlSearchNs(ctxt->myDoc, ctxt->node, prefix);
1976
1977    /*
1978     * allocate the node
1979     */
1980    if (ctxt->freeAttrs != NULL) {
1981        ret = ctxt->freeAttrs;
1982	ctxt->freeAttrs = ret->next;
1983	ctxt->freeAttrsNr--;
1984	memset(ret, 0, sizeof(xmlAttr));
1985	ret->type = XML_ATTRIBUTE_NODE;
1986
1987	ret->parent = ctxt->node;
1988	ret->doc = ctxt->myDoc;
1989	ret->ns = namespace;
1990
1991	if (ctxt->dictNames)
1992	    ret->name = localname;
1993	else
1994	    ret->name = xmlStrdup(localname);
1995
1996        /* link at the end to preserv order, TODO speed up with a last */
1997	if (ctxt->node->properties == NULL) {
1998	    ctxt->node->properties = ret;
1999	} else {
2000	    xmlAttrPtr prev = ctxt->node->properties;
2001
2002	    while (prev->next != NULL) prev = prev->next;
2003	    prev->next = ret;
2004	    ret->prev = prev;
2005	}
2006
2007	if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue))
2008	    xmlRegisterNodeDefaultValue((xmlNodePtr)ret);
2009    } else {
2010	if (ctxt->dictNames)
2011	    ret = xmlNewNsPropEatName(ctxt->node, namespace,
2012	                              (xmlChar *) localname, NULL);
2013	else
2014	    ret = xmlNewNsProp(ctxt->node, namespace, localname, NULL);
2015	if (ret == NULL) {
2016	    xmlErrMemory(ctxt, "xmlSAX2AttributeNs");
2017	    return;
2018	}
2019    }
2020
2021    if ((ctxt->replaceEntities == 0) && (!ctxt->html)) {
2022	xmlNodePtr tmp;
2023
2024	/*
2025	 * We know that if there is an entity reference, then
2026	 * the string has been dup'ed and terminates with 0
2027	 * otherwise with ' or "
2028	 */
2029	if (*valueend != 0) {
2030	    tmp = xmlSAX2TextNode(ctxt, value, valueend - value);
2031	    ret->children = tmp;
2032	    ret->last = tmp;
2033	    if (tmp != NULL) {
2034		tmp->doc = ret->doc;
2035		tmp->parent = (xmlNodePtr) ret;
2036	    }
2037	} else {
2038	    ret->children = xmlStringLenGetNodeList(ctxt->myDoc, value,
2039						    valueend - value);
2040	    tmp = ret->children;
2041	    while (tmp != NULL) {
2042	        tmp->doc = ret->doc;
2043		tmp->parent = (xmlNodePtr) ret;
2044		if (tmp->next == NULL)
2045		    ret->last = tmp;
2046		tmp = tmp->next;
2047	    }
2048	}
2049    } else if (value != NULL) {
2050	xmlNodePtr tmp;
2051
2052	tmp = xmlSAX2TextNode(ctxt, value, valueend - value);
2053	ret->children = tmp;
2054	ret->last = tmp;
2055	if (tmp != NULL) {
2056	    tmp->doc = ret->doc;
2057	    tmp->parent = (xmlNodePtr) ret;
2058	}
2059    }
2060
2061#ifdef LIBXML_VALID_ENABLED
2062    if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed &&
2063        ctxt->myDoc && ctxt->myDoc->intSubset) {
2064	/*
2065	 * If we don't substitute entities, the validation should be
2066	 * done on a value with replaced entities anyway.
2067	 */
2068        if (!ctxt->replaceEntities) {
2069	    dup = xmlSAX2DecodeAttrEntities(ctxt, value, valueend);
2070	    if (dup == NULL) {
2071	        if (*valueend == 0) {
2072		    ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2073				    ctxt->myDoc, ctxt->node, ret, value);
2074		} else {
2075		    /*
2076		     * That should already be normalized.
2077		     * cheaper to finally allocate here than duplicate
2078		     * entry points in the full validation code
2079		     */
2080		    dup = xmlStrndup(value, valueend - value);
2081
2082		    ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2083				    ctxt->myDoc, ctxt->node, ret, dup);
2084		}
2085	    } else {
2086	        /*
2087		 * dup now contains a string of the flattened attribute
2088		 * content with entities substitued. Check if we need to
2089		 * apply an extra layer of normalization.
2090		 * It need to be done twice ... it's an extra burden related
2091		 * to the ability to keep references in attributes
2092		 */
2093		if (ctxt->attsSpecial != NULL) {
2094		    xmlChar *nvalnorm;
2095		    xmlChar fn[50];
2096		    xmlChar *fullname;
2097
2098		    fullname = xmlBuildQName(localname, prefix, fn, 50);
2099		    if (fullname != NULL) {
2100			ctxt->vctxt.valid = 1;
2101		        nvalnorm = xmlValidCtxtNormalizeAttributeValue(
2102			                 &ctxt->vctxt, ctxt->myDoc,
2103					 ctxt->node, fullname, dup);
2104			if (ctxt->vctxt.valid != 1)
2105			    ctxt->valid = 0;
2106
2107			if ((fullname != fn) && (fullname != localname))
2108			    xmlFree(fullname);
2109			if (nvalnorm != NULL) {
2110			    xmlFree(dup);
2111			    dup = nvalnorm;
2112			}
2113		    }
2114		}
2115
2116		ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2117			        ctxt->myDoc, ctxt->node, ret, dup);
2118	    }
2119	} else {
2120	    /*
2121	     * if entities already have been substitued, then
2122	     * the attribute as passed is already normalized
2123	     */
2124	    dup = xmlStrndup(value, valueend - value);
2125
2126	    ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2127	                             ctxt->myDoc, ctxt->node, ret, dup);
2128	}
2129    } else
2130#endif /* LIBXML_VALID_ENABLED */
2131           if (((ctxt->loadsubset & XML_SKIP_IDS) == 0) &&
2132	       (((ctxt->replaceEntities == 0) && (ctxt->external != 2)) ||
2133	        ((ctxt->replaceEntities != 0) && (ctxt->inSubset == 0)))) {
2134        /*
2135	 * when validating, the ID registration is done at the attribute
2136	 * validation level. Otherwise we have to do specific handling here.
2137	 */
2138        if ((prefix == ctxt->str_xml) &&
2139	           (localname[0] == 'i') && (localname[1] == 'd') &&
2140		   (localname[2] == 0)) {
2141	    /*
2142	     * Add the xml:id value
2143	     *
2144	     * Open issue: normalization of the value.
2145	     */
2146	    if (dup == NULL)
2147	        dup = xmlStrndup(value, valueend - value);
2148#ifdef LIBXML_VALID_ENABLED
2149	    if (xmlValidateNCName(dup, 1) != 0) {
2150	        xmlErrValid(ctxt, XML_DTD_XMLID_VALUE,
2151		      "xml:id : attribute value %s is not an NCName\n",
2152			    (const char *) dup, NULL);
2153	    }
2154#endif
2155	    xmlAddID(&ctxt->vctxt, ctxt->myDoc, dup, ret);
2156	} else if (xmlIsID(ctxt->myDoc, ctxt->node, ret)) {
2157	    /* might be worth duplicate entry points and not copy */
2158	    if (dup == NULL)
2159	        dup = xmlStrndup(value, valueend - value);
2160	    xmlAddID(&ctxt->vctxt, ctxt->myDoc, dup, ret);
2161	} else if (xmlIsRef(ctxt->myDoc, ctxt->node, ret)) {
2162	    if (dup == NULL)
2163	        dup = xmlStrndup(value, valueend - value);
2164	    xmlAddRef(&ctxt->vctxt, ctxt->myDoc, dup, ret);
2165	}
2166    }
2167    if (dup != NULL)
2168	xmlFree(dup);
2169}
2170
2171#ifdef __APPLE__
2172#include <dispatch/dispatch.h>
2173#include <mach-o/dyld.h>
2174
2175extern int dyld_get_program_sdk_version(void);
2176#define DYLD_MACOSX_VERSION_10_9 0x000A0900
2177
2178// libxml2 v2.9 changed how elements with undeclared namespace prefixes are handled, an error case that has undefined behavior,
2179// in such a way that broke Microsoft Document Connection. Detect Microsoft Document Connection and mimic the old behavior.
2180static bool evaluateStartElementNSNeedsUndeclaredPrefixQuirk(void)
2181{
2182    const char* executablePath = _dyld_get_image_name(0);
2183    if (!executablePath)
2184        return false;
2185
2186    // Find the base name portion of the path.
2187    const char* executableName = strrchr(executablePath, '/');
2188    if (!executableName)
2189        return false;
2190
2191    // Move past the slash.
2192    executableName++;
2193
2194    if (strcmp(executableName, "Microsoft Document Connection"))
2195        return false;
2196
2197    // Apply the workaround if the application was linked against an SDK prior to where
2198    // libxml2 v2.9 was present.
2199    return dyld_get_program_sdk_version() < DYLD_MACOSX_VERSION_10_9;
2200}
2201
2202static bool startElementNSNeedsUndeclaredPrefixQuirk(void)
2203{
2204    static bool needsQuirk;
2205    static dispatch_once_t hasEvaluatedQuirk;
2206    dispatch_once(&hasEvaluatedQuirk, ^{
2207        needsQuirk = evaluateStartElementNSNeedsUndeclaredPrefixQuirk();
2208    });
2209
2210    return needsQuirk;
2211}
2212
2213#endif
2214
2215/**
2216 * xmlSAX2StartElementNs:
2217 * @ctx:  the user data (XML parser context)
2218 * @localname:  the local name of the element
2219 * @prefix:  the element namespace prefix if available
2220 * @URI:  the element namespace name if available
2221 * @nb_namespaces:  number of namespace definitions on that node
2222 * @namespaces:  pointer to the array of prefix/URI pairs namespace definitions
2223 * @nb_attributes:  the number of attributes on that node
2224 * @nb_defaulted:  the number of defaulted attributes.
2225 * @attributes:  pointer to the array of (localname/prefix/URI/value/end)
2226 *               attribute values.
2227 *
2228 * SAX2 callback when an element start has been detected by the parser.
2229 * It provides the namespace informations for the element, as well as
2230 * the new namespace declarations on the element.
2231 */
2232void
2233xmlSAX2StartElementNs(void *ctx,
2234                      const xmlChar *localname,
2235		      const xmlChar *prefix,
2236		      const xmlChar *URI,
2237		      int nb_namespaces,
2238		      const xmlChar **namespaces,
2239		      int nb_attributes,
2240		      int nb_defaulted,
2241		      const xmlChar **attributes)
2242{
2243    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2244    xmlNodePtr ret;
2245    xmlNodePtr parent;
2246    xmlNsPtr last = NULL, ns;
2247    const xmlChar *uri, *pref;
2248    xmlChar *lname = NULL;
2249    int i, j;
2250
2251    if (ctx == NULL) return;
2252    parent = ctxt->node;
2253    /*
2254     * First check on validity:
2255     */
2256    if (ctxt->validate && (ctxt->myDoc->extSubset == NULL) &&
2257        ((ctxt->myDoc->intSubset == NULL) ||
2258	 ((ctxt->myDoc->intSubset->notations == NULL) &&
2259	  (ctxt->myDoc->intSubset->elements == NULL) &&
2260	  (ctxt->myDoc->intSubset->attributes == NULL) &&
2261	  (ctxt->myDoc->intSubset->entities == NULL)))) {
2262	xmlErrValid(ctxt, XML_DTD_NO_DTD,
2263	  "Validation failed: no DTD found !", NULL, NULL);
2264	ctxt->validate = 0;
2265    }
2266
2267#ifdef __APPLE__
2268    if (!startElementNSNeedsUndeclaredPrefixQuirk()) {
2269#endif
2270    /*
2271     * Take care of the rare case of an undefined namespace prefix
2272     */
2273    if ((prefix != NULL) && (URI == NULL)) {
2274        if (ctxt->dictNames) {
2275	    const xmlChar *fullname;
2276
2277	    fullname = xmlDictQLookup(ctxt->dict, prefix, localname);
2278	    if (fullname != NULL)
2279	        localname = fullname;
2280	} else {
2281	    lname = xmlBuildQName(localname, prefix, NULL, 0);
2282	}
2283    }
2284#ifdef __APPLE__
2285    }
2286#endif
2287    /*
2288     * allocate the node
2289     */
2290    if (ctxt->freeElems != NULL) {
2291        ret = ctxt->freeElems;
2292	ctxt->freeElems = ret->next;
2293	ctxt->freeElemsNr--;
2294	memset(ret, 0, sizeof(xmlNode));
2295	ret->type = XML_ELEMENT_NODE;
2296
2297	if (ctxt->dictNames)
2298	    ret->name = localname;
2299	else {
2300	    if (lname == NULL)
2301		ret->name = xmlStrdup(localname);
2302	    else
2303	        ret->name = lname;
2304	    if (ret->name == NULL) {
2305	        xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs");
2306		return;
2307	    }
2308	}
2309	if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue))
2310	    xmlRegisterNodeDefaultValue(ret);
2311    } else {
2312	if (ctxt->dictNames)
2313	    ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL,
2314	                               (xmlChar *) localname, NULL);
2315	else if (lname == NULL)
2316	    ret = xmlNewDocNode(ctxt->myDoc, NULL, localname, NULL);
2317	else
2318	    ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL,
2319	                               (xmlChar *) lname, NULL);
2320	if (ret == NULL) {
2321	    xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs");
2322	    return;
2323	}
2324    }
2325    if (ctxt->linenumbers) {
2326	if (ctxt->input != NULL) {
2327	    if (ctxt->input->line < 65535)
2328		ret->line = (short) ctxt->input->line;
2329	    else
2330	        ret->line = 65535;
2331	}
2332    }
2333
2334    if (parent == NULL) {
2335        xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
2336    }
2337    /*
2338     * Build the namespace list
2339     */
2340    for (i = 0,j = 0;j < nb_namespaces;j++) {
2341        pref = namespaces[i++];
2342	uri = namespaces[i++];
2343	ns = xmlNewNs(NULL, uri, pref);
2344	if (ns != NULL) {
2345	    if (last == NULL) {
2346	        ret->nsDef = last = ns;
2347	    } else {
2348	        last->next = ns;
2349		last = ns;
2350	    }
2351	    if ((URI != NULL) && (prefix == pref))
2352		ret->ns = ns;
2353	} else {
2354            /*
2355             * any out of memory error would already have been raised
2356             * but we can't be garanteed it's the actual error due to the
2357             * API, best is to skip in this case
2358             */
2359	    continue;
2360	}
2361#ifdef LIBXML_VALID_ENABLED
2362	if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed &&
2363	    ctxt->myDoc && ctxt->myDoc->intSubset) {
2364	    ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc,
2365	                                           ret, prefix, ns, uri);
2366	}
2367#endif /* LIBXML_VALID_ENABLED */
2368    }
2369    ctxt->nodemem = -1;
2370
2371    /*
2372     * We are parsing a new node.
2373     */
2374    nodePush(ctxt, ret);
2375
2376    /*
2377     * Link the child element
2378     */
2379    if (parent != NULL) {
2380        if (parent->type == XML_ELEMENT_NODE) {
2381	    xmlAddChild(parent, ret);
2382	} else {
2383	    xmlAddSibling(parent, ret);
2384	}
2385    }
2386
2387    /*
2388     * Insert the defaulted attributes from the DTD only if requested:
2389     */
2390    if ((nb_defaulted != 0) &&
2391        ((ctxt->loadsubset & XML_COMPLETE_ATTRS) == 0))
2392	nb_attributes -= nb_defaulted;
2393
2394    /*
2395     * Search the namespace if it wasn't already found
2396     * Note that, if prefix is NULL, this searches for the default Ns
2397     */
2398    if ((URI != NULL) && (ret->ns == NULL)) {
2399        ret->ns = xmlSearchNs(ctxt->myDoc, parent, prefix);
2400	if ((ret->ns == NULL) && (xmlStrEqual(prefix, BAD_CAST "xml"))) {
2401	    ret->ns = xmlSearchNs(ctxt->myDoc, ret, prefix);
2402	}
2403	if (ret->ns == NULL) {
2404	    ns = xmlNewNs(ret, NULL, prefix);
2405	    if (ns == NULL) {
2406
2407	        xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs");
2408		return;
2409	    }
2410            if (prefix != NULL)
2411                xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
2412                             "Namespace prefix %s was not found\n",
2413                             prefix, NULL);
2414            else
2415                xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
2416                             "Namespace default prefix was not found\n",
2417                             NULL, NULL);
2418	}
2419    }
2420
2421    /*
2422     * process all the other attributes
2423     */
2424    if (nb_attributes > 0) {
2425        for (j = 0,i = 0;i < nb_attributes;i++,j+=5) {
2426	    /*
2427	     * Handle the rare case of an undefined atribute prefix
2428	     */
2429	    if ((attributes[j+1] != NULL) && (attributes[j+2] == NULL)) {
2430		if (ctxt->dictNames) {
2431		    const xmlChar *fullname;
2432
2433		    fullname = xmlDictQLookup(ctxt->dict, attributes[j+1],
2434		                              attributes[j]);
2435		    if (fullname != NULL) {
2436			xmlSAX2AttributeNs(ctxt, fullname, NULL,
2437			                   attributes[j+3], attributes[j+4]);
2438		        continue;
2439		    }
2440		} else {
2441		    lname = xmlBuildQName(attributes[j], attributes[j+1],
2442		                          NULL, 0);
2443		    if (lname != NULL) {
2444			xmlSAX2AttributeNs(ctxt, lname, NULL,
2445			                   attributes[j+3], attributes[j+4]);
2446			xmlFree(lname);
2447		        continue;
2448		    }
2449		}
2450	    }
2451	    xmlSAX2AttributeNs(ctxt, attributes[j], attributes[j+1],
2452			       attributes[j+3], attributes[j+4]);
2453	}
2454    }
2455
2456#ifdef LIBXML_VALID_ENABLED
2457    /*
2458     * If it's the Document root, finish the DTD validation and
2459     * check the document root element for validity
2460     */
2461    if ((ctxt->validate) && (ctxt->vctxt.finishDtd == XML_CTXT_FINISH_DTD_0)) {
2462	int chk;
2463
2464	chk = xmlValidateDtdFinal(&ctxt->vctxt, ctxt->myDoc);
2465	if (chk <= 0)
2466	    ctxt->valid = 0;
2467	if (chk < 0)
2468	    ctxt->wellFormed = 0;
2469	ctxt->valid &= xmlValidateRoot(&ctxt->vctxt, ctxt->myDoc);
2470	ctxt->vctxt.finishDtd = XML_CTXT_FINISH_DTD_1;
2471    }
2472#endif /* LIBXML_VALID_ENABLED */
2473}
2474
2475/**
2476 * xmlSAX2EndElementNs:
2477 * @ctx:  the user data (XML parser context)
2478 * @localname:  the local name of the element
2479 * @prefix:  the element namespace prefix if available
2480 * @URI:  the element namespace name if available
2481 *
2482 * SAX2 callback when an element end has been detected by the parser.
2483 * It provides the namespace informations for the element.
2484 */
2485void
2486xmlSAX2EndElementNs(void *ctx,
2487                    const xmlChar * localname ATTRIBUTE_UNUSED,
2488                    const xmlChar * prefix ATTRIBUTE_UNUSED,
2489		    const xmlChar * URI ATTRIBUTE_UNUSED)
2490{
2491    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2492    xmlParserNodeInfo node_info;
2493    xmlNodePtr cur;
2494
2495    if (ctx == NULL) return;
2496    cur = ctxt->node;
2497    /* Capture end position and add node */
2498    if ((ctxt->record_info) && (cur != NULL)) {
2499        node_info.end_pos = ctxt->input->cur - ctxt->input->base;
2500        node_info.end_line = ctxt->input->line;
2501        node_info.node = cur;
2502        xmlParserAddNodeInfo(ctxt, &node_info);
2503    }
2504    ctxt->nodemem = -1;
2505
2506#ifdef LIBXML_VALID_ENABLED
2507    if (ctxt->validate && ctxt->wellFormed &&
2508        ctxt->myDoc && ctxt->myDoc->intSubset)
2509        ctxt->valid &= xmlValidateOneElement(&ctxt->vctxt, ctxt->myDoc, cur);
2510#endif /* LIBXML_VALID_ENABLED */
2511
2512    /*
2513     * end of parsing of this node.
2514     */
2515    nodePop(ctxt);
2516}
2517
2518/**
2519 * xmlSAX2Reference:
2520 * @ctx: the user data (XML parser context)
2521 * @name:  The entity name
2522 *
2523 * called when an entity xmlSAX2Reference is detected.
2524 */
2525void
2526xmlSAX2Reference(void *ctx, const xmlChar *name)
2527{
2528    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2529    xmlNodePtr ret;
2530
2531    if (ctx == NULL) return;
2532#ifdef DEBUG_SAX
2533    xmlGenericError(xmlGenericErrorContext,
2534	    "SAX.xmlSAX2Reference(%s)\n", name);
2535#endif
2536    if (name[0] == '#')
2537	ret = xmlNewCharRef(ctxt->myDoc, name);
2538    else
2539	ret = xmlNewReference(ctxt->myDoc, name);
2540#ifdef DEBUG_SAX_TREE
2541    xmlGenericError(xmlGenericErrorContext,
2542	    "add xmlSAX2Reference %s to %s \n", name, ctxt->node->name);
2543#endif
2544    if (xmlAddChild(ctxt->node, ret) == NULL) {
2545        xmlFreeNode(ret);
2546    }
2547}
2548
2549/**
2550 * xmlSAX2Characters:
2551 * @ctx: the user data (XML parser context)
2552 * @ch:  a xmlChar string
2553 * @len: the number of xmlChar
2554 *
2555 * receiving some chars from the parser.
2556 */
2557void
2558xmlSAX2Characters(void *ctx, const xmlChar *ch, int len)
2559{
2560    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2561    xmlNodePtr lastChild;
2562
2563    if (ctx == NULL) return;
2564#ifdef DEBUG_SAX
2565    xmlGenericError(xmlGenericErrorContext,
2566	    "SAX.xmlSAX2Characters(%.30s, %d)\n", ch, len);
2567#endif
2568    /*
2569     * Handle the data if any. If there is no child
2570     * add it as content, otherwise if the last child is text,
2571     * concatenate it, else create a new node of type text.
2572     */
2573
2574    if (ctxt->node == NULL) {
2575#ifdef DEBUG_SAX_TREE
2576	xmlGenericError(xmlGenericErrorContext,
2577		"add chars: ctxt->node == NULL !\n");
2578#endif
2579        return;
2580    }
2581    lastChild = ctxt->node->last;
2582#ifdef DEBUG_SAX_TREE
2583    xmlGenericError(xmlGenericErrorContext,
2584	    "add chars to %s \n", ctxt->node->name);
2585#endif
2586
2587    /*
2588     * Here we needed an accelerator mechanism in case of very large
2589     * elements. Use an attribute in the structure !!!
2590     */
2591    if (lastChild == NULL) {
2592        lastChild = xmlSAX2TextNode(ctxt, ch, len);
2593	if (lastChild != NULL) {
2594	    ctxt->node->children = lastChild;
2595	    ctxt->node->last = lastChild;
2596	    lastChild->parent = ctxt->node;
2597	    lastChild->doc = ctxt->node->doc;
2598	    ctxt->nodelen = len;
2599	    ctxt->nodemem = len + 1;
2600	} else {
2601	    xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters");
2602	    return;
2603	}
2604    } else {
2605	int coalesceText = (lastChild != NULL) &&
2606	    (lastChild->type == XML_TEXT_NODE) &&
2607	    (lastChild->name == xmlStringText);
2608	if ((coalesceText) && (ctxt->nodemem != 0)) {
2609	    /*
2610	     * The whole point of maintaining nodelen and nodemem,
2611	     * xmlTextConcat is too costly, i.e. compute length,
2612	     * reallocate a new buffer, move data, append ch. Here
2613	     * We try to minimaze realloc() uses and avoid copying
2614	     * and recomputing length over and over.
2615	     */
2616	    if (lastChild->content == (xmlChar *)&(lastChild->properties)) {
2617		lastChild->content = xmlStrdup(lastChild->content);
2618		lastChild->properties = NULL;
2619	    } else if ((ctxt->nodemem == ctxt->nodelen + 1) &&
2620	               (xmlDictOwns(ctxt->dict, lastChild->content))) {
2621		lastChild->content = xmlStrdup(lastChild->content);
2622	    }
2623            if (((size_t)ctxt->nodelen + (size_t)len > XML_MAX_TEXT_LENGTH) &&
2624                ((ctxt->options & XML_PARSE_HUGE) == 0)) {
2625                xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters: huge text node");
2626                return;
2627            }
2628	    if ((size_t)ctxt->nodelen > SIZE_T_MAX - (size_t)len ||
2629	        (size_t)ctxt->nodemem + (size_t)len > SIZE_T_MAX / 2) {
2630                xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters overflow prevented");
2631                return;
2632	    }
2633	    if (ctxt->nodelen + len >= ctxt->nodemem) {
2634		xmlChar *newbuf;
2635		size_t size;
2636
2637		size = ctxt->nodemem + len;
2638		size *= 2;
2639                newbuf = (xmlChar *) xmlRealloc(lastChild->content,size);
2640		if (newbuf == NULL) {
2641		    xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters");
2642		    return;
2643		}
2644		ctxt->nodemem = size;
2645		lastChild->content = newbuf;
2646	    }
2647	    memcpy(&lastChild->content[ctxt->nodelen], ch, len);
2648	    ctxt->nodelen += len;
2649	    lastChild->content[ctxt->nodelen] = 0;
2650	} else if (coalesceText) {
2651	    if (xmlTextConcat(lastChild, ch, len)) {
2652		xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters");
2653	    }
2654	    if (ctxt->node->children != NULL) {
2655		ctxt->nodelen = xmlStrlen(lastChild->content);
2656		ctxt->nodemem = ctxt->nodelen + 1;
2657	    }
2658	} else {
2659	    /* Mixed content, first time */
2660	    lastChild = xmlSAX2TextNode(ctxt, ch, len);
2661	    if (lastChild != NULL) {
2662		xmlAddChild(ctxt->node, lastChild);
2663		if (ctxt->node->children != NULL) {
2664		    ctxt->nodelen = len;
2665		    ctxt->nodemem = len + 1;
2666		}
2667	    }
2668	}
2669    }
2670}
2671
2672/**
2673 * xmlSAX2IgnorableWhitespace:
2674 * @ctx: the user data (XML parser context)
2675 * @ch:  a xmlChar string
2676 * @len: the number of xmlChar
2677 *
2678 * receiving some ignorable whitespaces from the parser.
2679 * UNUSED: by default the DOM building will use xmlSAX2Characters
2680 */
2681void
2682xmlSAX2IgnorableWhitespace(void *ctx ATTRIBUTE_UNUSED, const xmlChar *ch ATTRIBUTE_UNUSED, int len ATTRIBUTE_UNUSED)
2683{
2684    /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
2685#ifdef DEBUG_SAX
2686    xmlGenericError(xmlGenericErrorContext,
2687	    "SAX.xmlSAX2IgnorableWhitespace(%.30s, %d)\n", ch, len);
2688#endif
2689}
2690
2691/**
2692 * xmlSAX2ProcessingInstruction:
2693 * @ctx: the user data (XML parser context)
2694 * @target:  the target name
2695 * @data: the PI data's
2696 *
2697 * A processing instruction has been parsed.
2698 */
2699void
2700xmlSAX2ProcessingInstruction(void *ctx, const xmlChar *target,
2701                      const xmlChar *data)
2702{
2703    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2704    xmlNodePtr ret;
2705    xmlNodePtr parent;
2706
2707    if (ctx == NULL) return;
2708    parent = ctxt->node;
2709#ifdef DEBUG_SAX
2710    xmlGenericError(xmlGenericErrorContext,
2711	    "SAX.xmlSAX2ProcessingInstruction(%s, %s)\n", target, data);
2712#endif
2713
2714    ret = xmlNewDocPI(ctxt->myDoc, target, data);
2715    if (ret == NULL) return;
2716
2717    if (ctxt->linenumbers) {
2718	if (ctxt->input != NULL) {
2719	    if (ctxt->input->line < 65535)
2720		ret->line = (short) ctxt->input->line;
2721	    else
2722	        ret->line = 65535;
2723	}
2724    }
2725    if (ctxt->inSubset == 1) {
2726	xmlAddChild((xmlNodePtr) ctxt->myDoc->intSubset, ret);
2727	return;
2728    } else if (ctxt->inSubset == 2) {
2729	xmlAddChild((xmlNodePtr) ctxt->myDoc->extSubset, ret);
2730	return;
2731    }
2732    if (parent == NULL) {
2733#ifdef DEBUG_SAX_TREE
2734	    xmlGenericError(xmlGenericErrorContext,
2735		    "Setting PI %s as root\n", target);
2736#endif
2737        xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
2738	return;
2739    }
2740    if (parent->type == XML_ELEMENT_NODE) {
2741#ifdef DEBUG_SAX_TREE
2742	xmlGenericError(xmlGenericErrorContext,
2743		"adding PI %s child to %s\n", target, parent->name);
2744#endif
2745	xmlAddChild(parent, ret);
2746    } else {
2747#ifdef DEBUG_SAX_TREE
2748	xmlGenericError(xmlGenericErrorContext,
2749		"adding PI %s sibling to ", target);
2750	xmlDebugDumpOneNode(stderr, parent, 0);
2751#endif
2752	xmlAddSibling(parent, ret);
2753    }
2754}
2755
2756/**
2757 * xmlSAX2Comment:
2758 * @ctx: the user data (XML parser context)
2759 * @value:  the xmlSAX2Comment content
2760 *
2761 * A xmlSAX2Comment has been parsed.
2762 */
2763void
2764xmlSAX2Comment(void *ctx, const xmlChar *value)
2765{
2766    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2767    xmlNodePtr ret;
2768    xmlNodePtr parent;
2769
2770    if (ctx == NULL) return;
2771    parent = ctxt->node;
2772#ifdef DEBUG_SAX
2773    xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2Comment(%s)\n", value);
2774#endif
2775    ret = xmlNewDocComment(ctxt->myDoc, value);
2776    if (ret == NULL) return;
2777    if (ctxt->linenumbers) {
2778	if (ctxt->input != NULL) {
2779	    if (ctxt->input->line < 65535)
2780		ret->line = (short) ctxt->input->line;
2781	    else
2782	        ret->line = 65535;
2783	}
2784    }
2785
2786    if (ctxt->inSubset == 1) {
2787	xmlAddChild((xmlNodePtr) ctxt->myDoc->intSubset, ret);
2788	return;
2789    } else if (ctxt->inSubset == 2) {
2790	xmlAddChild((xmlNodePtr) ctxt->myDoc->extSubset, ret);
2791	return;
2792    }
2793    if (parent == NULL) {
2794#ifdef DEBUG_SAX_TREE
2795	    xmlGenericError(xmlGenericErrorContext,
2796		    "Setting xmlSAX2Comment as root\n");
2797#endif
2798        xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
2799	return;
2800    }
2801    if (parent->type == XML_ELEMENT_NODE) {
2802#ifdef DEBUG_SAX_TREE
2803	xmlGenericError(xmlGenericErrorContext,
2804		"adding xmlSAX2Comment child to %s\n", parent->name);
2805#endif
2806	xmlAddChild(parent, ret);
2807    } else {
2808#ifdef DEBUG_SAX_TREE
2809	xmlGenericError(xmlGenericErrorContext,
2810		"adding xmlSAX2Comment sibling to ");
2811	xmlDebugDumpOneNode(stderr, parent, 0);
2812#endif
2813	xmlAddSibling(parent, ret);
2814    }
2815}
2816
2817/**
2818 * xmlSAX2CDataBlock:
2819 * @ctx: the user data (XML parser context)
2820 * @value:  The pcdata content
2821 * @len:  the block length
2822 *
2823 * called when a pcdata block has been parsed
2824 */
2825void
2826xmlSAX2CDataBlock(void *ctx, const xmlChar *value, int len)
2827{
2828    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2829    xmlNodePtr ret, lastChild;
2830
2831    if (ctx == NULL) return;
2832#ifdef DEBUG_SAX
2833    xmlGenericError(xmlGenericErrorContext,
2834	    "SAX.pcdata(%.10s, %d)\n", value, len);
2835#endif
2836    lastChild = xmlGetLastChild(ctxt->node);
2837#ifdef DEBUG_SAX_TREE
2838    xmlGenericError(xmlGenericErrorContext,
2839	    "add chars to %s \n", ctxt->node->name);
2840#endif
2841    if ((lastChild != NULL) &&
2842        (lastChild->type == XML_CDATA_SECTION_NODE)) {
2843	xmlTextConcat(lastChild, value, len);
2844    } else {
2845	ret = xmlNewCDataBlock(ctxt->myDoc, value, len);
2846	xmlAddChild(ctxt->node, ret);
2847    }
2848}
2849
2850static int xmlSAX2DefaultVersionValue = 2;
2851
2852#ifdef LIBXML_SAX1_ENABLED
2853/**
2854 * xmlSAXDefaultVersion:
2855 * @version:  the version, 1 or 2
2856 *
2857 * Set the default version of SAX used globally by the library.
2858 * By default, during initialization the default is set to 2.
2859 * Note that it is generally a better coding style to use
2860 * xmlSAXVersion() to set up the version explicitly for a given
2861 * parsing context.
2862 *
2863 * Returns the previous value in case of success and -1 in case of error.
2864 */
2865int
2866xmlSAXDefaultVersion(int version)
2867{
2868    int ret = xmlSAX2DefaultVersionValue;
2869
2870    if ((version != 1) && (version != 2))
2871        return(-1);
2872    xmlSAX2DefaultVersionValue = version;
2873    return(ret);
2874}
2875#endif /* LIBXML_SAX1_ENABLED */
2876
2877/**
2878 * xmlSAXVersion:
2879 * @hdlr:  the SAX handler
2880 * @version:  the version, 1 or 2
2881 *
2882 * Initialize the default XML SAX handler according to the version
2883 *
2884 * Returns 0 in case of success and -1 in case of error.
2885 */
2886int
2887xmlSAXVersion(xmlSAXHandler *hdlr, int version)
2888{
2889    if (hdlr == NULL) return(-1);
2890    if (version == 2) {
2891	hdlr->startElement = NULL;
2892	hdlr->endElement = NULL;
2893	hdlr->startElementNs = xmlSAX2StartElementNs;
2894	hdlr->endElementNs = xmlSAX2EndElementNs;
2895	hdlr->serror = NULL;
2896	hdlr->initialized = XML_SAX2_MAGIC;
2897#ifdef LIBXML_SAX1_ENABLED
2898    } else if (version == 1) {
2899	hdlr->startElement = xmlSAX2StartElement;
2900	hdlr->endElement = xmlSAX2EndElement;
2901	hdlr->initialized = 1;
2902#endif /* LIBXML_SAX1_ENABLED */
2903    } else
2904        return(-1);
2905    hdlr->internalSubset = xmlSAX2InternalSubset;
2906    hdlr->externalSubset = xmlSAX2ExternalSubset;
2907    hdlr->isStandalone = xmlSAX2IsStandalone;
2908    hdlr->hasInternalSubset = xmlSAX2HasInternalSubset;
2909    hdlr->hasExternalSubset = xmlSAX2HasExternalSubset;
2910    hdlr->resolveEntity = xmlSAX2ResolveEntity;
2911    hdlr->getEntity = xmlSAX2GetEntity;
2912    hdlr->getParameterEntity = xmlSAX2GetParameterEntity;
2913    hdlr->entityDecl = xmlSAX2EntityDecl;
2914    hdlr->attributeDecl = xmlSAX2AttributeDecl;
2915    hdlr->elementDecl = xmlSAX2ElementDecl;
2916    hdlr->notationDecl = xmlSAX2NotationDecl;
2917    hdlr->unparsedEntityDecl = xmlSAX2UnparsedEntityDecl;
2918    hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator;
2919    hdlr->startDocument = xmlSAX2StartDocument;
2920    hdlr->endDocument = xmlSAX2EndDocument;
2921    hdlr->reference = xmlSAX2Reference;
2922    hdlr->characters = xmlSAX2Characters;
2923    hdlr->cdataBlock = xmlSAX2CDataBlock;
2924    hdlr->ignorableWhitespace = xmlSAX2Characters;
2925    hdlr->processingInstruction = xmlSAX2ProcessingInstruction;
2926    hdlr->comment = xmlSAX2Comment;
2927    hdlr->warning = xmlParserWarning;
2928    hdlr->error = xmlParserError;
2929    hdlr->fatalError = xmlParserError;
2930
2931    return(0);
2932}
2933
2934/**
2935 * xmlSAX2InitDefaultSAXHandler:
2936 * @hdlr:  the SAX handler
2937 * @warning:  flag if non-zero sets the handler warning procedure
2938 *
2939 * Initialize the default XML SAX2 handler
2940 */
2941void
2942xmlSAX2InitDefaultSAXHandler(xmlSAXHandler *hdlr, int warning)
2943{
2944    if ((hdlr == NULL) || (hdlr->initialized != 0))
2945	return;
2946
2947    xmlSAXVersion(hdlr, xmlSAX2DefaultVersionValue);
2948    if (warning == 0)
2949	hdlr->warning = NULL;
2950    else
2951	hdlr->warning = xmlParserWarning;
2952}
2953
2954/**
2955 * xmlDefaultSAXHandlerInit:
2956 *
2957 * Initialize the default SAX2 handler
2958 */
2959void
2960xmlDefaultSAXHandlerInit(void)
2961{
2962#ifdef LIBXML_SAX1_ENABLED
2963    xmlSAXVersion((xmlSAXHandlerPtr) &xmlDefaultSAXHandler, 1);
2964#endif /* LIBXML_SAX1_ENABLED */
2965}
2966
2967#ifdef LIBXML_HTML_ENABLED
2968
2969/**
2970 * xmlSAX2InitHtmlDefaultSAXHandler:
2971 * @hdlr:  the SAX handler
2972 *
2973 * Initialize the default HTML SAX2 handler
2974 */
2975void
2976xmlSAX2InitHtmlDefaultSAXHandler(xmlSAXHandler *hdlr)
2977{
2978    if ((hdlr == NULL) || (hdlr->initialized != 0))
2979	return;
2980
2981    hdlr->internalSubset = xmlSAX2InternalSubset;
2982    hdlr->externalSubset = NULL;
2983    hdlr->isStandalone = NULL;
2984    hdlr->hasInternalSubset = NULL;
2985    hdlr->hasExternalSubset = NULL;
2986    hdlr->resolveEntity = NULL;
2987    hdlr->getEntity = xmlSAX2GetEntity;
2988    hdlr->getParameterEntity = NULL;
2989    hdlr->entityDecl = NULL;
2990    hdlr->attributeDecl = NULL;
2991    hdlr->elementDecl = NULL;
2992    hdlr->notationDecl = NULL;
2993    hdlr->unparsedEntityDecl = NULL;
2994    hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator;
2995    hdlr->startDocument = xmlSAX2StartDocument;
2996    hdlr->endDocument = xmlSAX2EndDocument;
2997    hdlr->startElement = xmlSAX2StartElement;
2998    hdlr->endElement = xmlSAX2EndElement;
2999    hdlr->reference = NULL;
3000    hdlr->characters = xmlSAX2Characters;
3001    hdlr->cdataBlock = xmlSAX2CDataBlock;
3002    hdlr->ignorableWhitespace = xmlSAX2IgnorableWhitespace;
3003    hdlr->processingInstruction = xmlSAX2ProcessingInstruction;
3004    hdlr->comment = xmlSAX2Comment;
3005    hdlr->warning = xmlParserWarning;
3006    hdlr->error = xmlParserError;
3007    hdlr->fatalError = xmlParserError;
3008
3009    hdlr->initialized = 1;
3010}
3011
3012/**
3013 * htmlDefaultSAXHandlerInit:
3014 *
3015 * Initialize the default SAX handler
3016 */
3017void
3018htmlDefaultSAXHandlerInit(void)
3019{
3020    xmlSAX2InitHtmlDefaultSAXHandler((xmlSAXHandlerPtr) &htmlDefaultSAXHandler);
3021}
3022
3023#endif /* LIBXML_HTML_ENABLED */
3024
3025#ifdef LIBXML_DOCB_ENABLED
3026
3027/**
3028 * xmlSAX2InitDocbDefaultSAXHandler:
3029 * @hdlr:  the SAX handler
3030 *
3031 * Initialize the default DocBook SAX2 handler
3032 */
3033void
3034xmlSAX2InitDocbDefaultSAXHandler(xmlSAXHandler *hdlr)
3035{
3036    if ((hdlr == NULL) || (hdlr->initialized != 0))
3037	return;
3038
3039    hdlr->internalSubset = xmlSAX2InternalSubset;
3040    hdlr->externalSubset = NULL;
3041    hdlr->isStandalone = xmlSAX2IsStandalone;
3042    hdlr->hasInternalSubset = xmlSAX2HasInternalSubset;
3043    hdlr->hasExternalSubset = xmlSAX2HasExternalSubset;
3044    hdlr->resolveEntity = xmlSAX2ResolveEntity;
3045    hdlr->getEntity = xmlSAX2GetEntity;
3046    hdlr->getParameterEntity = NULL;
3047    hdlr->entityDecl = xmlSAX2EntityDecl;
3048    hdlr->attributeDecl = NULL;
3049    hdlr->elementDecl = NULL;
3050    hdlr->notationDecl = NULL;
3051    hdlr->unparsedEntityDecl = NULL;
3052    hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator;
3053    hdlr->startDocument = xmlSAX2StartDocument;
3054    hdlr->endDocument = xmlSAX2EndDocument;
3055    hdlr->startElement = xmlSAX2StartElement;
3056    hdlr->endElement = xmlSAX2EndElement;
3057    hdlr->reference = xmlSAX2Reference;
3058    hdlr->characters = xmlSAX2Characters;
3059    hdlr->cdataBlock = NULL;
3060    hdlr->ignorableWhitespace = xmlSAX2IgnorableWhitespace;
3061    hdlr->processingInstruction = NULL;
3062    hdlr->comment = xmlSAX2Comment;
3063    hdlr->warning = xmlParserWarning;
3064    hdlr->error = xmlParserError;
3065    hdlr->fatalError = xmlParserError;
3066
3067    hdlr->initialized = 1;
3068}
3069
3070/**
3071 * docbDefaultSAXHandlerInit:
3072 *
3073 * Initialize the default SAX handler
3074 */
3075void
3076docbDefaultSAXHandlerInit(void)
3077{
3078    xmlSAX2InitDocbDefaultSAXHandler((xmlSAXHandlerPtr) &docbDefaultSAXHandler);
3079}
3080
3081#endif /* LIBXML_DOCB_ENABLED */
3082#define bottom_SAX2
3083#include "elfgcchack.h"
3084