2 * "Canonical XML" implementation
3 * http://www.w3.org/TR/xml-c14n
5 * "Exclusive XML Canonicalization" implementation
6 * http://www.w3.org/TR/xml-exc-c14n
8 * See Copyright for the status of this software.
10 * Author: Aleksey Sanin <aleksey@aleksey.com>
14 #ifdef LIBXML_C14N_ENABLED
15 #ifdef LIBXML_OUTPUT_ENABLED
22 #include <libxml/tree.h>
23 #include <libxml/parser.h>
24 #include <libxml/uri.h>
25 #include <libxml/xmlerror.h>
26 #include <libxml/globals.h>
27 #include <libxml/xpathInternals.h>
28 #include <libxml/c14n.h>
32 /************************************************************************
34 * Some declaration better left private ATM *
36 ************************************************************************/
/* Three position constants, numbered 0..2: before, inside and after the
 * document element. */
39 XMLC14N_BEFORE_DOCUMENT_ELEMENT
= 0,
40 XMLC14N_INSIDE_DOCUMENT_ELEMENT
= 1,
41 XMLC14N_AFTER_DOCUMENT_ELEMENT
= 2
/*
 * Bookkeeping for the namespaces recorded during canonicalization.
 * nsTab and nodeTab are filled in lock-step: xmlC14NVisibleNsStackAdd()
 * stores a namespace and its node at the same index of the two arrays.
 */
44 typedef struct _xmlC14NVisibleNsStack
{
45 int nsCurEnd
; /* one past the last used slot; lookups scan from nsCurEnd - 1 downward */
46 int nsPrevStart
; /* the beginning of the stack for previous visible node */
47 int nsPrevEnd
; /* the end of the stack for previous visible node */
48 int nsMax
; /* size of the array as allocated */
49 xmlNsPtr
*nsTab
; /* array of ns in no particular order */
50 xmlNodePtr
*nodeTab
; /* array of nodes in no particular order */
51 } xmlC14NVisibleNsStack
, *xmlC14NVisibleNsStackPtr
;
/*
 * Canonicalization context handed to every helper in this file.
 * NOTE(review): other code in this file also reads ctx->user_data,
 * ctx->mode and ctx->doc; those members are not visible in this listing.
 */
53 typedef struct _xmlC14NCtx
{
54 /* input parameters */
/* optional node filter; xmlC14NIsVisible() treats a NULL callback as
 * "every node is visible" */
56 xmlC14NIsVisibleCallback is_visible_callback
;
/* output buffer that the print helpers write to */
59 xmlOutputBufferPtr buf
;
61 /* position in the XML document */
/* stack passed to the xmlC14NVisibleNsStack* helpers */
64 xmlC14NVisibleNsStackPtr ns_rendered
;
69 /* exclusive canonicalization */
/* NULL-terminated array of prefixes, or NULL when no list was given */
70 xmlChar
**inclusive_ns_prefixes
;
74 } xmlC14NCtx
, *xmlC14NCtxPtr
;
76 static xmlC14NVisibleNsStackPtr
xmlC14NVisibleNsStackCreate (void);
77 static void xmlC14NVisibleNsStackDestroy (xmlC14NVisibleNsStackPtr cur
);
78 static void xmlC14NVisibleNsStackAdd (xmlC14NVisibleNsStackPtr cur
,
81 static void xmlC14NVisibleNsStackSave (xmlC14NVisibleNsStackPtr cur
,
82 xmlC14NVisibleNsStackPtr state
);
83 static void xmlC14NVisibleNsStackRestore (xmlC14NVisibleNsStackPtr cur
,
84 xmlC14NVisibleNsStackPtr state
);
85 static void xmlC14NVisibleNsStackShift (xmlC14NVisibleNsStackPtr cur
);
86 static int xmlC14NVisibleNsStackFind (xmlC14NVisibleNsStackPtr cur
,
88 static int xmlExcC14NVisibleNsStackFind (xmlC14NVisibleNsStackPtr cur
,
92 static int xmlC14NIsNodeInNodeset (xmlNodeSetPtr nodes
,
98 static int xmlC14NProcessNode(xmlC14NCtxPtr ctx
, xmlNodePtr cur
);
99 static int xmlC14NProcessNodeList(xmlC14NCtxPtr ctx
, xmlNodePtr cur
);
/* Mode selector passed as the second argument of xmlC11NNormalizeString();
 * one value each for attribute, comment, PI and text content. */
101 XMLC14N_NORMALIZE_ATTR
= 0,
102 XMLC14N_NORMALIZE_COMMENT
= 1,
103 XMLC14N_NORMALIZE_PI
= 2,
104 XMLC14N_NORMALIZE_TEXT
= 3
105 } xmlC14NNormalizationMode
;
107 static xmlChar
*xmlC11NNormalizeString(const xmlChar
* input
,
108 xmlC14NNormalizationMode mode
);
/* Shorthands for xmlC11NNormalizeString() with a fixed normalization mode. */
110 #define xmlC11NNormalizeAttr( a ) \
111 xmlC11NNormalizeString((a), XMLC14N_NORMALIZE_ATTR)
112 #define xmlC11NNormalizeComment( a ) \
113 xmlC11NNormalizeString((a), XMLC14N_NORMALIZE_COMMENT)
114 #define xmlC11NNormalizePI( a ) \
115 xmlC11NNormalizeString((a), XMLC14N_NORMALIZE_PI)
116 #define xmlC11NNormalizeText( a ) \
117 xmlC11NNormalizeString((a), XMLC14N_NORMALIZE_TEXT)
/* Asks the context's is_visible_callback about (node, parent), passing
 * ctx->user_data through; evaluates to 1 when no callback is installed.
 * The ctx argument is expanded more than once, so it must be free of
 * side effects. */
119 #define xmlC14NIsVisible( ctx, node, parent ) \
120 (((ctx)->is_visible_callback != NULL) ? \
121 (ctx)->is_visible_callback((ctx)->user_data, \
122 (xmlNodePtr)(node), (xmlNodePtr)(parent)) : 1)
/* Non-zero when the context's mode is XML_C14N_EXCLUSIVE_1_0. */
124 #define xmlC14NIsExclusive( ctx ) \
125 ( (ctx)->mode == XML_C14N_EXCLUSIVE_1_0 )
127 /************************************************************************
129 * Some factorized error routines *
131 ************************************************************************/
135 * @extra: extra information
137 * Handle a memory allocation error
/* Raises XML_ERR_NO_MEMORY in the XML_FROM_C14N domain at XML_ERR_ERROR
 * level. extra is handed to __xmlRaiseError twice: once as a string
 * argument and once as the %s value of the message. */
140 xmlC14NErrMemory(const char *extra
)
142 __xmlRaiseError(NULL
, NULL
, NULL
, NULL
, NULL
, XML_FROM_C14N
,
143 XML_ERR_NO_MEMORY
, XML_ERR_ERROR
, NULL
, 0, extra
,
145 "Memory allocation failed : %s\n", extra
);
150 * @extra: extra information
152 * Handle an invalid parameter error
/* Reports an invalid-parameter condition in the XML_FROM_C14N domain.
 * The error code used is XML_ERR_INTERNAL_ERROR, the same code that
 * xmlC14NErrInternal() raises; only the message text differs. */
155 xmlC14NErrParam(const char *extra
)
157 __xmlRaiseError(NULL
, NULL
, NULL
, NULL
, NULL
, XML_FROM_C14N
,
158 XML_ERR_INTERNAL_ERROR
, XML_ERR_ERROR
, NULL
, 0, extra
,
160 "Invalid parameter : %s\n", extra
);
164 * xmlC14NErrInternal:
165 * @extra: extra information
167 * Handle an internal error
/* Raises XML_ERR_INTERNAL_ERROR in the XML_FROM_C14N domain at
 * XML_ERR_ERROR level; extra describes the failing operation and is
 * substituted into the message. */
170 xmlC14NErrInternal(const char *extra
)
172 __xmlRaiseError(NULL
, NULL
, NULL
, NULL
, NULL
, XML_FROM_C14N
,
173 XML_ERR_INTERNAL_ERROR
, XML_ERR_ERROR
, NULL
, 0, extra
,
175 "Internal error : %s\n", extra
);
179 * xmlC14NErrInvalidNode:
180 * @extra: extra information
182 * Handle an invalid node error
/* Raises XML_C14N_INVALID_NODE in the XML_FROM_C14N domain. node_type is
 * a printable name of the node kind and fills the first %s of the
 * message; extra fills the second. */
185 xmlC14NErrInvalidNode(const char *node_type
, const char *extra
)
187 __xmlRaiseError(NULL
, NULL
, NULL
, NULL
, NULL
, XML_FROM_C14N
,
188 XML_C14N_INVALID_NODE
, XML_ERR_ERROR
, NULL
, 0, extra
,
190 "Node %s is invalid here : %s\n", node_type
, extra
);
194 * xmlC14NErrUnknownNode:
195 * @extra: extra information
197 * Handle an unknown node error
/* Raises XML_C14N_UNKNOW_NODE in the XML_FROM_C14N domain. node_type is
 * the numeric node type (printed with %d); extra fills the %s. */
200 xmlC14NErrUnknownNode(int node_type
, const char *extra
)
202 __xmlRaiseError(NULL
, NULL
, NULL
, NULL
, NULL
, XML_FROM_C14N
,
203 XML_C14N_UNKNOW_NODE
, XML_ERR_ERROR
, NULL
, 0, extra
,
205 "Unknown node type %d found : %s\n", node_type
, extra
);
209 * xmlC14NErrRelativeNamespace:
210 * @ns_uri: the relative namespace URI being reported
212 * Handle a relative namespace error
/* Raises XML_C14N_RELATIVE_NAMESPACE in the XML_FROM_C14N domain; ns_uri
 * is only used as the %s value of the message (the string argument slot
 * that the other reporters fill with extra is NULL here).
 * NOTE(review): "UR" in the message text looks like a typo for "URI";
 * left untouched because it is a runtime string. */
215 xmlC14NErrRelativeNamespace(const char *ns_uri
)
217 __xmlRaiseError(NULL
, NULL
, NULL
, NULL
, NULL
, XML_FROM_C14N
,
218 XML_C14N_RELATIVE_NAMESPACE
, XML_ERR_ERROR
, NULL
, 0, NULL
,
220 "Relative namespace UR is invalid here : %s\n", ns_uri
);
227 * @ctxt: a C14N evaluation context
228 * @node: the context node
229 * @error: the error code
231 * @extra: extra information
233 * Handle a generic C14N error
/* General-purpose reporter: unlike the helpers above it forwards the
 * context and the node to __xmlRaiseError, uses the caller-supplied
 * error code, and prints msg through a fixed "%s" format so that msg is
 * never interpreted as a format string.
 * NOTE(review): the declaration of msg is not visible in this listing. */
236 xmlC14NErr(xmlC14NCtxPtr ctxt
, xmlNodePtr node
, int error
,
241 __xmlRaiseError(NULL
, NULL
, NULL
,
242 ctxt
, node
, XML_FROM_C14N
, error
,
243 XML_ERR_ERROR
, NULL
, 0,
244 NULL
, NULL
, NULL
, 0, 0, "%s", msg
);
247 /************************************************************************
249 * The implementation internals *
251 ************************************************************************/
/* Number of slots xmlC14NVisibleNsStackAdd() allocates for nsTab and
 * nodeTab on first use. */
252 #define XML_NAMESPACES_DEFAULT 16
/*
 * Membership test of node in the XPath node-set nodes.
 *
 * Ordinary nodes are looked up directly with xmlXPathNodeSetContains().
 * A namespace declaration is first copied into a local xmlNs whose next
 * field is overwritten with the owning node (parent, or parent->parent
 * when parent is an attribute), and the copy is looked up instead.
 * NOTE(review): the result for nodes == NULL or node == NULL is not
 * visible in this listing.
 */
255 xmlC14NIsNodeInNodeset(xmlNodeSetPtr nodes
, xmlNodePtr node
, xmlNodePtr parent
) {
256 if((nodes
!= NULL
) && (node
!= NULL
)) {
257 if(node
->type
!= XML_NAMESPACE_DECL
) {
258 return(xmlXPathNodeSetContains(nodes
, node
));
/* namespace case: work on a private copy so the tree is not modified */
262 memcpy(&ns
, node
, sizeof(ns
));
264 /* this is a libxml hack! check xpath.c for details */
265 if((parent
!= NULL
) && (parent
->type
== XML_ATTRIBUTE_NODE
)) {
266 ns
.next
= (xmlNsPtr
)parent
->parent
;
268 ns
.next
= (xmlNsPtr
)parent
;
272 * If the input is an XPath node-set, then the node-set must explicitly
273 * contain every node to be rendered to the canonical form.
275 return(xmlXPathNodeSetContains(nodes
, (xmlNodePtr
)&ns
));
/* Allocates one xmlC14NVisibleNsStack with xmlMalloc() and zero-fills it,
 * so the tables start out NULL and every counter starts at 0. An
 * allocation failure is reported through xmlC14NErrMemory(). */
281 static xmlC14NVisibleNsStackPtr
282 xmlC14NVisibleNsStackCreate(void) {
283 xmlC14NVisibleNsStackPtr ret
;
285 ret
= (xmlC14NVisibleNsStackPtr
) xmlMalloc(sizeof(xmlC14NVisibleNsStack
));
287 xmlC14NErrMemory("creating namespaces stack");
290 memset(ret
, 0 , (size_t) sizeof(xmlC14NVisibleNsStack
));
/* Tears down a namespace stack: each table that exists is overwritten
 * with zeros over its full allocated size (nsMax entries), and finally
 * the structure itself is zeroed. A parameter error is reported with the
 * text "destroying namespaces stack".
 * NOTE(review): an xmlFree() is visible for nodeTab but not for nsTab or
 * for cur itself in this listing - confirm against the complete source. */
295 xmlC14NVisibleNsStackDestroy(xmlC14NVisibleNsStackPtr cur
) {
297 xmlC14NErrParam("destroying namespaces stack");
300 if(cur
->nsTab
!= NULL
) {
301 memset(cur
->nsTab
, 0, cur
->nsMax
* sizeof(xmlNsPtr
));
304 if(cur
->nodeTab
!= NULL
) {
305 memset(cur
->nodeTab
, 0, cur
->nsMax
* sizeof(xmlNodePtr
));
306 xmlFree(cur
->nodeTab
);
308 memset(cur
, 0, sizeof(xmlC14NVisibleNsStack
));
/*
 * Records the pair (ns, node) in slot nsCurEnd of the two tables,
 * allocating or growing them first when needed.
 *
 * cur:  the stack to extend
 * ns:   namespace stored in nsTab
 * node: node stored at the same index of nodeTab
 */
314 xmlC14NVisibleNsStackAdd(xmlC14NVisibleNsStackPtr cur
, xmlNsPtr ns
, xmlNodePtr node
) {
/* sanity check: the two tables must be either both NULL or both set */
316 ((cur
->nsTab
== NULL
) && (cur
->nodeTab
!= NULL
)) ||
317 ((cur
->nsTab
!= NULL
) && (cur
->nodeTab
== NULL
))) {
318 xmlC14NErrParam("adding namespace to stack");
/* first use: allocate XML_NAMESPACES_DEFAULT zeroed slots per table */
322 if ((cur
->nsTab
== NULL
) && (cur
->nodeTab
== NULL
)) {
323 cur
->nsTab
= (xmlNsPtr
*) xmlMalloc(XML_NAMESPACES_DEFAULT
* sizeof(xmlNsPtr
));
324 cur
->nodeTab
= (xmlNodePtr
*) xmlMalloc(XML_NAMESPACES_DEFAULT
* sizeof(xmlNodePtr
));
325 if ((cur
->nsTab
== NULL
) || (cur
->nodeTab
== NULL
)) {
326 xmlC14NErrMemory("adding node to stack");
329 memset(cur
->nsTab
, 0 , XML_NAMESPACES_DEFAULT
* sizeof(xmlNsPtr
));
330 memset(cur
->nodeTab
, 0 , XML_NAMESPACES_DEFAULT
* sizeof(xmlNodePtr
));
331 cur
->nsMax
= XML_NAMESPACES_DEFAULT
;
/* tables are full: double the capacity of both */
332 } else if(cur
->nsMax
== cur
->nsCurEnd
) {
/* NOTE(review): 2 * nsMax is int arithmetic; no overflow guard is
 * visible in this listing */
336 tmpSize
= 2 * cur
->nsMax
;
/* each realloc result is staged in tmp before being stored back */
337 tmp
= xmlRealloc(cur
->nsTab
, tmpSize
* sizeof(xmlNsPtr
));
339 xmlC14NErrMemory("adding node to stack");
342 cur
->nsTab
= (xmlNsPtr
*)tmp
;
344 tmp
= xmlRealloc(cur
->nodeTab
, tmpSize
* sizeof(xmlNodePtr
));
346 xmlC14NErrMemory("adding node to stack");
349 cur
->nodeTab
= (xmlNodePtr
*)tmp
;
/* nsMax is updated only after both tables have been handled */
351 cur
->nsMax
= tmpSize
;
/* store the pair at the same index of both tables */
353 cur
->nsTab
[cur
->nsCurEnd
] = ns
;
354 cur
->nodeTab
[cur
->nsCurEnd
] = node
;
/* Snapshots the three position counters of cur (nsCurEnd, nsPrevStart,
 * nsPrevEnd) into state. The tables themselves are not copied. A NULL
 * cur or state is reported through xmlC14NErrParam(). */
360 xmlC14NVisibleNsStackSave(xmlC14NVisibleNsStackPtr cur
, xmlC14NVisibleNsStackPtr state
) {
361 if((cur
== NULL
) || (state
== NULL
)) {
362 xmlC14NErrParam("saving namespaces stack");
366 state
->nsCurEnd
= cur
->nsCurEnd
;
367 state
->nsPrevStart
= cur
->nsPrevStart
;
368 state
->nsPrevEnd
= cur
->nsPrevEnd
;
/* Counterpart of xmlC14NVisibleNsStackSave(): copies the three position
 * counters from state back into cur. Table contents are left as they
 * are; lowering nsCurEnd is what makes later entries unreachable to the
 * lookups. A NULL cur or state is reported through xmlC14NErrParam(). */
372 xmlC14NVisibleNsStackRestore(xmlC14NVisibleNsStackPtr cur
, xmlC14NVisibleNsStackPtr state
) {
373 if((cur
== NULL
) || (state
== NULL
)) {
374 xmlC14NErrParam("restoring namespaces stack");
377 cur
->nsCurEnd
= state
->nsCurEnd
;
378 cur
->nsPrevStart
= state
->nsPrevStart
;
379 cur
->nsPrevEnd
= state
->nsPrevEnd
;
/* Advances the "previous visible node" window: the old end becomes the
 * new start and the current end becomes the new end, so the window then
 * covers the entries added since the last shift. */
383 xmlC14NVisibleNsStackShift(xmlC14NVisibleNsStackPtr cur
) {
385 xmlC14NErrParam("shifting namespaces stack");
388 cur
->nsPrevStart
= cur
->nsPrevEnd
;
389 cur
->nsPrevEnd
= cur
->nsCurEnd
;
/* String equality in which NULL and the empty string are interchangeable:
 * identical pointers (including two NULLs) compare equal, and when
 * exactly one side is NULL the result is whether the other side is
 * empty. Otherwise the strings are compared character by character. */
393 xmlC14NStrEqual(const xmlChar
*str1
, const xmlChar
*str2
) {
394 if (str1
== str2
) return(1);
395 if (str1
== NULL
) return((*str2
) == '\0');
396 if (str2
== NULL
) return((*str1
) == '\0');
398 if (*str1
++ != *str2
) return(0);
404 * xmlC14NVisibleNsStackFind:
405 * @cur: the stack of visible namespaces
406 * @ns: the namespace to check
408 * Checks whether the given namespace was already rendered or not
410 * Returns 1 if we already wrote this namespace or 0 otherwise
/*
 * Looks ns up in the stack, scanning from the newest entry downward.
 * The first entry whose prefix matches decides the outcome: the result
 * is whether its href matches too. When nothing matches, the result is
 * has_empty_ns, i.e. 1 only when ns is the empty default namespace.
 */
413 xmlC14NVisibleNsStackFind(xmlC14NVisibleNsStackPtr cur
, xmlNsPtr ns
)
416 const xmlChar
*prefix
;
421 xmlC14NErrParam("searching namespaces stack (c14n)");
426 * if the default namespace xmlns="" is not defined yet then
427 * we do not want to print it out
/* a NULL ns, prefix or href is treated as the empty string */
429 prefix
= ((ns
== NULL
) || (ns
->prefix
== NULL
)) ? BAD_CAST
"" : ns
->prefix
;
430 href
= ((ns
== NULL
) || (ns
->href
== NULL
)) ? BAD_CAST
"" : ns
->href
;
431 has_empty_ns
= (xmlC14NStrEqual(prefix
, NULL
) && xmlC14NStrEqual(href
, NULL
));
433 if (cur
->nsTab
!= NULL
) {
/* the empty default namespace is searched over the whole stack, any
 * other namespace only down to nsPrevStart */
434 int start
= (has_empty_ns
) ? 0 : cur
->nsPrevStart
;
435 for (i
= cur
->nsCurEnd
- 1; i
>= start
; --i
) {
436 xmlNsPtr ns1
= cur
->nsTab
[i
];
438 if(xmlC14NStrEqual(prefix
, (ns1
!= NULL
) ? ns1
->prefix
: NULL
)) {
439 return(xmlC14NStrEqual(href
, (ns1
!= NULL
) ? ns1
->href
: NULL
));
443 return(has_empty_ns
);
/*
 * Exclusive-C14N variant of the stack lookup. Entries are scanned from
 * the newest downward; for an entry whose prefix and href both match,
 * the result is the visibility (per xmlC14NIsVisible) of that stored
 * namespace relative to the node recorded with it. Without such an
 * entry the result is has_empty_ns.
 * NOTE(review): the initialisation of start and the handling of a
 * prefix match with a different href are not visible in this listing.
 */
447 xmlExcC14NVisibleNsStackFind(xmlC14NVisibleNsStackPtr cur
, xmlNsPtr ns
, xmlC14NCtxPtr ctx
) {
449 const xmlChar
*prefix
;
454 xmlC14NErrParam("searching namespaces stack (exc c14n)");
459 * if the default namespace xmlns="" is not defined yet then
460 * we do not want to print it out
/* a NULL ns, prefix or href is treated as the empty string */
462 prefix
= ((ns
== NULL
) || (ns
->prefix
== NULL
)) ? BAD_CAST
"" : ns
->prefix
;
463 href
= ((ns
== NULL
) || (ns
->href
== NULL
)) ? BAD_CAST
"" : ns
->href
;
464 has_empty_ns
= (xmlC14NStrEqual(prefix
, NULL
) && xmlC14NStrEqual(href
, NULL
));
466 if (cur
->nsTab
!= NULL
) {
468 for (i
= cur
->nsCurEnd
- 1; i
>= start
; --i
) {
469 xmlNsPtr ns1
= cur
->nsTab
[i
];
471 if(xmlC14NStrEqual(prefix
, (ns1
!= NULL
) ? ns1
->prefix
: NULL
)) {
472 if(xmlC14NStrEqual(href
, (ns1
!= NULL
) ? ns1
->href
: NULL
)) {
473 return(xmlC14NIsVisible(ctx
, ns1
, cur
->nodeTab
[i
]));
480 return(has_empty_ns
);
488 * @ns: the namespace to check
490 * Checks whether the given namespace is a default "xml:" namespace
491 * with href="http://www.w3.org/XML/1998/namespace"
493 * Returns 1 if the node is default or 0 otherwise
496 /* todo: make it a define? */
/* True only for a non-NULL namespace whose prefix is exactly "xml" and
 * whose href equals XML_XML_NAMESPACE; both conditions must hold. */
498 xmlC14NIsXmlNs(xmlNsPtr ns
)
500 return ((ns
!= NULL
) &&
501 (xmlStrEqual(ns
->prefix
, BAD_CAST
"xml")) &&
502 (xmlStrEqual(ns
->href
, XML_XML_NAMESPACE
)));
508 * @ns1: the pointer to first namespace
509 * @ns2: the pointer to second namespace
511 * Compares the namespaces by names (prefixes).
513 * Returns -1 if ns1 < ns2, 0 if ns1 == ns2 or 1 if ns1 > ns2.
/* Ordering callback handed to xmlListCreate() for the namespace lists:
 * the visible comparison orders two namespaces by prefix with
 * xmlStrcmp(); the href is not consulted.
 * NOTE(review): any special-casing of identical or NULL arguments is
 * not visible in this listing. */
516 xmlC14NNsCompare(xmlNsPtr ns1
, xmlNsPtr ns2
)
525 return (xmlStrcmp(ns1
->prefix
, ns2
->prefix
));
530 * xmlC14NPrintNamespaces:
531 * @ns: the pointer to namespace
532 * @ctx: the C14N context
534 * Prints the given namespace to the output buffer from C14N context.
536 * Returns 1 on success or 0 on fail.
/*
 * Writes one namespace declaration to ctx->buf. With a prefix the output
 * starts with  xmlns:PREFIX=  and without one with  xmlns=  (each with a
 * leading space). The value is written by xmlBufWriteQuotedString() when
 * href is set, otherwise as an empty pair of double quotes. Also used as
 * the xmlListWalk() callback by the namespace-axis routines.
 */
539 xmlC14NPrintNamespaces(const xmlNsPtr ns
, xmlC14NCtxPtr ctx
)
542 if ((ns
== NULL
) || (ctx
== NULL
)) {
543 xmlC14NErrParam("writing namespaces");
547 if (ns
->prefix
!= NULL
) {
548 xmlOutputBufferWriteString(ctx
->buf
, " xmlns:");
549 xmlOutputBufferWriteString(ctx
->buf
, (const char *) ns
->prefix
);
550 xmlOutputBufferWriteString(ctx
->buf
, "=");
552 xmlOutputBufferWriteString(ctx
->buf
, " xmlns=");
554 if(ns
->href
!= NULL
) {
/* quoting of the value is delegated to xmlBufWriteQuotedString() */
555 xmlBufWriteQuotedString(ctx
->buf
->buffer
, ns
->href
);
557 xmlOutputBufferWriteString(ctx
->buf
, "\"\"");
563 * xmlC14NProcessNamespacesAxis:
564 * @ctx: the C14N context
565 * @node: the current node
567 * Prints out canonical namespace axis of the current node to the
568 * buffer from C14N context as follows
570 * Canonical XML v 1.0 (http://www.w3.org/TR/xml-c14n)
573 * Consider a list L containing only namespace nodes in the
574 * axis and in the node-set in lexicographic order (ascending). To begin
575 * processing L, if the first node is not the default namespace node (a node
576 * with no namespace URI and no local name), then generate a space followed
577 * by xmlns="" if and only if the following conditions are met:
578 * - the element E that owns the axis is in the node-set
579 * - The nearest ancestor element of E in the node-set has a default
580 * namespace node in the node-set (default namespace nodes always
581 * have non-empty values in XPath)
582 * The latter condition eliminates unnecessary occurrences of xmlns="" in
583 * the canonical form since an element only receives an xmlns="" if its
584 * default namespace is empty and if it has an immediate parent in the
585 * canonical form that has a non-empty default namespace. To finish
586 * processing L, simply process every namespace node in L, except omit
587 * namespace node with local name xml, which defines the xml prefix,
588 * if its string value is http://www.w3.org/XML/1998/namespace.
590 * Exclusive XML Canonicalization v 1.0 (http://www.w3.org/TR/xml-exc-c14n)
591 * Canonical XML applied to a document subset requires the search of the
592 * ancestor nodes of each orphan element node for attributes in the xml
593 * namespace, such as xml:lang and xml:space. These are copied into the
594 * element node except if a declaration of the same attribute is already
595 * in the attribute axis of the element (whether or not it is included in
596 * the document subset). This search and copying are omitted from the
597 * Exclusive XML Canonicalization method.
599 * Returns 0 on success or -1 on fail.
/*
 * Renders the namespace axis of element cur for Canonical XML.
 *
 * Walks cur and all of its ancestors, and for every nsDef entry that is
 * still the binding xmlSearchNs() finds for that prefix at cur, is not
 * the xml namespace and is visible: records it on ctx->ns_rendered and,
 * unless it was rendered already, queues it on a list sorted by
 * xmlC14NNsCompare. The queued namespaces are finally printed with
 * xmlC14NPrintNamespaces().
 */
602 xmlC14NProcessNamespacesAxis(xmlC14NCtxPtr ctx
, xmlNodePtr cur
, int visible
)
607 int already_rendered
;
608 int has_empty_ns
= 0;
610 if ((ctx
== NULL
) || (cur
== NULL
) || (cur
->type
!= XML_ELEMENT_NODE
)) {
611 xmlC14NErrParam("processing namespaces axis (c14n)");
616 * Create a sorted list to store element namespaces
618 list
= xmlListCreate(NULL
, (xmlListDataCompare
) xmlC14NNsCompare
);
620 xmlC14NErrInternal("creating namespaces list (c14n)");
624 /* check all namespaces */
625 for(n
= cur
; n
!= NULL
; n
= n
->parent
) {
626 for(ns
= n
->nsDef
; ns
!= NULL
; ns
= ns
->next
) {
/* tmp == ns below means this declaration is the one in effect at cur,
 * i.e. it is not shadowed by a nearer declaration of the same prefix */
627 tmp
= xmlSearchNs(cur
->doc
, cur
, ns
->prefix
);
629 if((tmp
== ns
) && !xmlC14NIsXmlNs(ns
) && xmlC14NIsVisible(ctx
, ns
, cur
)) {
/* the lookup has to happen before the namespace is added below */
630 already_rendered
= xmlC14NVisibleNsStackFind(ctx
->ns_rendered
, ns
);
632 xmlC14NVisibleNsStackAdd(ctx
->ns_rendered
, ns
, cur
);
634 if(!already_rendered
) {
635 xmlListInsert(list
, ns
);
637 if(xmlStrlen(ns
->prefix
) == 0) {
645 * if the first node is not the default namespace node (a node with no
646 * namespace URI and no local name), then generate a space followed by
647 * xmlns="" if and only if the following conditions are met:
648 * - the element E that owns the axis is in the node-set
649 * - the nearest ancestor element of E in the node-set has a default
650 * namespace node in the node-set (default namespace nodes always
651 * have non-empty values in XPath)
653 if(visible
&& !has_empty_ns
) {
/* NOTE(review): ns_default is a static object that is re-zeroed on
 * every call; it is shared by all callers, so concurrent use from
 * several threads would race on it. An automatic variable looks
 * sufficient here - confirm. */
654 static xmlNs ns_default
;
656 memset(&ns_default
, 0, sizeof(ns_default
));
657 if(!xmlC14NVisibleNsStackFind(ctx
->ns_rendered
, &ns_default
)) {
658 xmlC14NPrintNamespaces(&ns_default
, ctx
);
664 * print out all elements from list
666 xmlListWalk(list
, (xmlListWalker
) xmlC14NPrintNamespaces
, (const void *) ctx
);
677 * xmlExcC14NProcessNamespacesAxis:
678 * @ctx: the C14N context
679 * @node: the current node
681 * Prints out exclusive canonical namespace axis of the current node to the
682 * buffer from C14N context as follows
684 * Exclusive XML Canonicalization
685 * http://www.w3.org/TR/xml-exc-c14n
687 * If the element node is in the XPath subset then output the node in
688 * accordance with Canonical XML except for namespace nodes which are
689 * rendered as follows:
691 * 1. Render each namespace node iff:
692 * * it is visibly utilized by the immediate parent element or one of
693 * its attributes, or is present in InclusiveNamespaces PrefixList, and
694 * * its prefix and value do not appear in ns_rendered. ns_rendered is
695 * obtained by popping the state stack in order to obtain a list of
696 * prefixes and their values which have already been rendered by
697 * an output ancestor of the namespace node's parent element.
698 * 2. Append the rendered namespace node to the list ns_rendered of namespace
699 * nodes rendered by output ancestors. Push ns_rendered on state stack and
701 * 3. After the recursion returns, pop the state stack.
704 * Returns 0 on success or -1 on fail.
/*
 * Renders the namespace axis of element cur for Exclusive C14N.
 *
 * Three sources feed the sorted output list:
 *   1. prefixes named in ctx->inclusive_ns_prefixes (looked up with
 *      xmlSearchNs and checked with the plain, non-exclusive stack find);
 *   2. the namespace of the element itself;
 *   3. the namespaces of its visible attributes.
 * Three flags track whether an empty-prefix namespace was seen, whether
 * the empty default namespace is visibly utilized, and whether the
 * inclusive list asked for the default namespace; they decide whether a
 * synthetic empty default declaration is printed before the list.
 * Rejects contexts that are not in exclusive mode.
 */
707 xmlExcC14NProcessNamespacesAxis(xmlC14NCtxPtr ctx
, xmlNodePtr cur
, int visible
)
712 int already_rendered
;
713 int has_empty_ns
= 0;
714 int has_visibly_utilized_empty_ns
= 0;
715 int has_empty_ns_in_inclusive_list
= 0;
717 if ((ctx
== NULL
) || (cur
== NULL
) || (cur
->type
!= XML_ELEMENT_NODE
)) {
718 xmlC14NErrParam("processing namespaces axis (exc c14n)");
722 if(!xmlC14NIsExclusive(ctx
)) {
723 xmlC14NErrParam("processing namespaces axis (exc c14n)");
729 * Create a sorted list to store element namespaces
731 list
= xmlListCreate(NULL
, (xmlListDataCompare
) xmlC14NNsCompare
);
733 xmlC14NErrInternal("creating namespaces list (exc c14n)");
738 * process inclusive namespaces:
739 * All namespace nodes appearing on inclusive ns list are
740 * handled as provided in Canonical XML
742 if(ctx
->inclusive_ns_prefixes
!= NULL
) {
/* the prefix array is NULL-terminated */
746 for (i
= 0; ctx
->inclusive_ns_prefixes
[i
] != NULL
; ++i
) {
747 prefix
= ctx
->inclusive_ns_prefixes
[i
];
749 * Special values for namespace with empty prefix
/* both "#default" and "" select the default namespace */
751 if (xmlStrEqual(prefix
, BAD_CAST
"#default")
752 || xmlStrEqual(prefix
, BAD_CAST
"")) {
754 has_empty_ns_in_inclusive_list
= 1;
757 ns
= xmlSearchNs(cur
->doc
, cur
, prefix
);
758 if((ns
!= NULL
) && !xmlC14NIsXmlNs(ns
) && xmlC14NIsVisible(ctx
, ns
, cur
)) {
/* inclusive prefixes use the Canonical XML (non-exclusive) lookup */
759 already_rendered
= xmlC14NVisibleNsStackFind(ctx
->ns_rendered
, ns
);
761 xmlC14NVisibleNsStackAdd(ctx
->ns_rendered
, ns
, cur
);
763 if(!already_rendered
) {
764 xmlListInsert(list
, ns
);
766 if(xmlStrlen(ns
->prefix
) == 0) {
773 /* add node namespace */
774 if(cur
->ns
!= NULL
) {
/* element without a namespace of its own: fall back to the default
 * namespace in scope and remember that it is visibly utilized */
777 ns
= xmlSearchNs(cur
->doc
, cur
, NULL
);
778 has_visibly_utilized_empty_ns
= 1;
780 if((ns
!= NULL
) && !xmlC14NIsXmlNs(ns
)) {
781 if(visible
&& xmlC14NIsVisible(ctx
, ns
, cur
)) {
782 if(!xmlExcC14NVisibleNsStackFind(ctx
->ns_rendered
, ns
, ctx
)) {
783 xmlListInsert(list
, ns
);
787 xmlC14NVisibleNsStackAdd(ctx
->ns_rendered
, ns
, cur
);
789 if(xmlStrlen(ns
->prefix
) == 0) {
/* namespaces used by the element's attributes */
796 for(attr
= cur
->properties
; attr
!= NULL
; attr
= attr
->next
) {
798 * we need to check that attribute is visible and has non
799 * default namespace (XML Namespaces: "default namespaces
800 * do not apply directly to attributes")
802 if((attr
->ns
!= NULL
) && !xmlC14NIsXmlNs(attr
->ns
) && xmlC14NIsVisible(ctx
, attr
, cur
)) {
/* look up first, then record, so the attribute's namespace is not
 * found because of its own entry */
803 already_rendered
= xmlExcC14NVisibleNsStackFind(ctx
->ns_rendered
, attr
->ns
, ctx
);
804 xmlC14NVisibleNsStackAdd(ctx
->ns_rendered
, attr
->ns
, cur
);
805 if(!already_rendered
&& visible
) {
806 xmlListInsert(list
, attr
->ns
);
808 if(xmlStrlen(attr
->ns
->prefix
) == 0) {
811 } else if((attr
->ns
!= NULL
) && (xmlStrlen(attr
->ns
->prefix
) == 0) && (xmlStrlen(attr
->ns
->href
) == 0)) {
812 has_visibly_utilized_empty_ns
= 1;
/* case 1: the empty default namespace is visibly utilized, no
 * empty-prefix namespace was seen and the inclusive list did not ask
 * for the default namespace: use the exclusive lookup */
819 if(visible
&& has_visibly_utilized_empty_ns
&&
820 !has_empty_ns
&& !has_empty_ns_in_inclusive_list
) {
/* NOTE(review): static scratch object re-zeroed on each call and
 * shared between callers; an automatic variable looks sufficient -
 * confirm. */
821 static xmlNs ns_default
;
823 memset(&ns_default
, 0, sizeof(ns_default
));
825 already_rendered
= xmlExcC14NVisibleNsStackFind(ctx
->ns_rendered
, &ns_default
, ctx
);
826 if(!already_rendered
) {
827 xmlC14NPrintNamespaces(&ns_default
, ctx
);
/* case 2: the inclusive list asked for the default namespace: use the
 * Canonical XML lookup instead */
829 } else if(visible
&& !has_empty_ns
&& has_empty_ns_in_inclusive_list
) {
830 static xmlNs ns_default
;
832 memset(&ns_default
, 0, sizeof(ns_default
));
833 if(!xmlC14NVisibleNsStackFind(ctx
->ns_rendered
, &ns_default
)) {
834 xmlC14NPrintNamespaces(&ns_default
, ctx
);
841 * print out all elements from list
843 xmlListWalk(list
, (xmlListWalker
) xmlC14NPrintNamespaces
, (const void *) ctx
);
855 * @attr: the attr to check
857 * Checks whether the given attribute is a default "xml:" namespace
858 * with href="http://www.w3.org/XML/1998/namespace"
860 * Returns 1 if the node is default or 0 otherwise
863 /* todo: make it a define? */
/* True when the attribute carries a namespace and that namespace passes
 * xmlC14NIsXmlNs(). attr itself is dereferenced without a NULL check,
 * so callers must pass a valid attribute. */
865 xmlC14NIsXmlAttr(xmlAttrPtr attr
)
867 return ((attr
->ns
!= NULL
) &&
868 (xmlC14NIsXmlNs(attr
->ns
) != 0));
873 * xmlC14NAttrsCompare:
874 * @attr1: the pointer to first attr
875 * @attr2: the pointer to second attr
877 * Compares the given attributes for ordering in the canonical output.
879 * Returns -1 if attr1 < attr2, 0 if attr1 == attr2 or 1 if attr1 > attr2.
/*
 * Ordering callback for the attribute list. Attributes that share the
 * same namespace pointer (including both having none) are ordered by
 * name. Otherwise a missing namespace or a missing prefix on either
 * side is special-cased, and the remaining attributes are compared by
 * namespace href and then by name.
 * NOTE(review): the values returned by the four NULL special cases and
 * the condition guarding the name comparison are not visible in this
 * listing.
 */
882 xmlC14NAttrsCompare(xmlAttrPtr attr1
, xmlAttrPtr attr2
)
895 if (attr1
->ns
== attr2
->ns
) {
896 return (xmlStrcmp(attr1
->name
, attr2
->name
));
900 * Attributes in the default namespace are first
901 * because the default namespace is not applied to
902 * unqualified attributes
904 if (attr1
->ns
== NULL
)
906 if (attr2
->ns
== NULL
)
908 if (attr1
->ns
->prefix
== NULL
)
910 if (attr2
->ns
->prefix
== NULL
)
/* primary key: namespace href */
913 ret
= xmlStrcmp(attr1
->ns
->href
, attr2
->ns
->href
);
/* secondary key: attribute name */
915 ret
= xmlStrcmp(attr1
->name
, attr2
->name
);
923 * @attr: the pointer to attr
924 * @ctx: the C14N context
926 * Prints out canonical attribute of the current node to the
927 * buffer from C14N context as follows
929 * Canonical XML v 1.0 (http://www.w3.org/TR/xml-c14n)
931 * Returns 1 on success or 0 on fail.
/*
 * Writes one attribute to ctx->buf as  [prefix:]name="value"  preceded
 * by a single space. The prefix is emitted only when the attribute has
 * a namespace with a non-empty prefix. The value is the text of the
 * attribute's children (xmlNodeListGetString) passed through
 * xmlC11NNormalizeAttr(); a failed normalization is reported through
 * xmlC14NErrInternal().
 */
934 xmlC14NPrintAttrs(const xmlAttrPtr attr
, xmlC14NCtxPtr ctx
)
939 if ((attr
== NULL
) || (ctx
== NULL
)) {
940 xmlC14NErrParam("writing attributes");
944 xmlOutputBufferWriteString(ctx
->buf
, " ");
945 if (attr
->ns
!= NULL
&& xmlStrlen(attr
->ns
->prefix
) > 0) {
946 xmlOutputBufferWriteString(ctx
->buf
,
947 (const char *) attr
->ns
->prefix
);
948 xmlOutputBufferWriteString(ctx
->buf
, ":");
950 xmlOutputBufferWriteString(ctx
->buf
, (const char *) attr
->name
);
951 xmlOutputBufferWriteString(ctx
->buf
, "=\"");
953 value
= xmlNodeListGetString(ctx
->doc
, attr
->children
, 1);
954 /* todo: should we log an error if value==NULL ? */
956 buffer
= xmlC11NNormalizeAttr(value
);
958 if (buffer
!= NULL
) {
959 xmlOutputBufferWriteString(ctx
->buf
, (const char *) buffer
);
962 xmlC14NErrInternal("normalizing attributes axis");
/* closing quote of the attribute value */
966 xmlOutputBufferWriteString(ctx
->buf
, "\"");
971 * xmlC14NFindHiddenParentAttr:
973 * Finds an attribute in a hidden parent node.
975 * Returns a pointer to the attribute node (if found) or NULL otherwise.
/* Starting at cur, visits nodes for as long as they are invisible
 * (per xmlC14NIsVisible relative to their parent) and queries each one
 * with xmlHasNsProp() for the attribute name in namespace ns. The loop
 * also ends when cur becomes NULL.
 * NOTE(review): the step that advances cur and the handling of a
 * successful lookup are not visible in this listing. */
978 xmlC14NFindHiddenParentAttr(xmlC14NCtxPtr ctx
, xmlNodePtr cur
, const xmlChar
* name
, const xmlChar
* ns
)
981 while((cur
!= NULL
) && (!xmlC14NIsVisible(ctx
, cur
, cur
->parent
))) {
982 res
= xmlHasNsProp(cur
, name
, ns
);
994 * xmlC14NFixupBaseAttr:
996 * Fixes up the xml:base attribute
998 * Returns the newly created attribute or NULL
/*
 * Computes the effective xml:base value for an element whose ancestors
 * are partly invisible. Starting from the value of xml_base_attr, it
 * inspects the invisible ancestors of the attribute's element for their
 * own xml:base attributes and combines the values with xmlBuildURI().
 * A non-empty result is wrapped in a new, parentless attribute created
 * by xmlNewNsProp().
 * NOTE(review): ownership of res, tmp_str and tmp_str2 cannot be checked
 * here because the corresponding release calls are not visible in this
 * listing.
 */
1001 xmlC14NFixupBaseAttr(xmlC14NCtxPtr ctx
, xmlAttrPtr xml_base_attr
)
1003 xmlChar
* res
= NULL
;
1010 if ((ctx
== NULL
) || (xml_base_attr
== NULL
) || (xml_base_attr
->parent
== NULL
)) {
1011 xmlC14NErrParam("processing xml:base attribute");
1015 /* start from current value */
1016 res
= xmlNodeListGetString(ctx
->doc
, xml_base_attr
->children
, 1);
1018 xmlC14NErrInternal("processing xml:base attribute - can't get attr value");
1022 /* go up the stack until we find a node that we rendered already */
/* xml_base_attr->parent is the owning element; start at its parent */
1023 cur
= xml_base_attr
->parent
->parent
;
1024 while((cur
!= NULL
) && (!xmlC14NIsVisible(ctx
, cur
, cur
->parent
))) {
1025 attr
= xmlHasNsProp(cur
, BAD_CAST
"base", XML_XML_NAMESPACE
);
1027 /* get attr value */
1028 tmp_str
= xmlNodeListGetString(ctx
->doc
, attr
->children
, 1);
1029 if(tmp_str
== NULL
) {
1032 xmlC14NErrInternal("processing xml:base attribute - can't get attr value");
1036 /* we need to add '/' if our current base uri ends with '..' or '.'
1037 to ensure that we are forced to go "up" all the time */
1038 tmp_str_len
= xmlStrlen(tmp_str
);
/* NOTE(review): the test inspects the second-to-last character, so a
 * value ending in a single '.' after another character (such as "a/.")
 * does not match although the comment above mentions it - confirm the
 * intended index. */
1039 if(tmp_str_len
> 1 && tmp_str
[tmp_str_len
- 2] == '.') {
1040 tmp_str2
= xmlStrcat(tmp_str
, BAD_CAST
"/");
1041 if(tmp_str2
== NULL
) {
1045 xmlC14NErrInternal("processing xml:base attribute - can't modify uri");
/* resolve the value accumulated so far against the ancestor's base */
1053 tmp_str2
= xmlBuildURI(res
, tmp_str
);
1054 if(tmp_str2
== NULL
) {
1058 xmlC14NErrInternal("processing xml:base attribute - can't construct uri");
1062 /* cleanup and set the new res */
1072 /* check if result uri is empty or not */
1073 if((res
== NULL
) || xmlStrEqual(res
, BAD_CAST
"")) {
1078 /* create and return the new attribute node */
/* NULL as first argument: the new attribute is not attached to a node */
1079 attr
= xmlNewNsProp(NULL
, xml_base_attr
->ns
, BAD_CAST
"base", res
);
1083 xmlC14NErrInternal("processing xml:base attribute - can't construct attribute");
1093 * xmlC14NProcessAttrsAxis:
1094 * @ctx: the C14N context
1095 * @cur: the current node
1096 * @parent_visible: the visibility of parent node
1097 * @all_parents_visible: the visibility of all parent nodes
1099 * Prints out canonical attribute axis of the current node to the
1100 * buffer from C14N context as follows
1102 * Canonical XML v 1.0 (http://www.w3.org/TR/xml-c14n)
1105 * In lexicographic order (ascending), process each node that
1106 * is in the element's attribute axis and in the node-set.
1108 * The processing of an element node E MUST be modified slightly
1109 * when an XPath node-set is given as input and the element's
1110 * parent is omitted from the node-set.
1113 * Exclusive XML Canonicalization v 1.0 (http://www.w3.org/TR/xml-exc-c14n)
1115 * Canonical XML applied to a document subset requires the search of the
1116 * ancestor nodes of each orphan element node for attributes in the xml
1117 * namespace, such as xml:lang and xml:space. These are copied into the
1118 * element node except if a declaration of the same attribute is already
1119 * in the attribute axis of the element (whether or not it is included in
1120 * the document subset). This search and copying are omitted from the
1121 * Exclusive XML Canonicalization method.
1123 * Returns 0 on success or -1 on fail.
1126 xmlC14NProcessAttrsAxis(xmlC14NCtxPtr ctx
, xmlNodePtr cur
, int parent_visible
)
1130 xmlAttrPtr attrs_to_delete
= NULL
;
1132 /* special processing for 1.1 spec */
1133 xmlAttrPtr xml_base_attr
= NULL
;
1134 xmlAttrPtr xml_lang_attr
= NULL
;
1135 xmlAttrPtr xml_space_attr
= NULL
;
1137 if ((ctx
== NULL
) || (cur
== NULL
) || (cur
->type
!= XML_ELEMENT_NODE
)) {
1138 xmlC14NErrParam("processing attributes axis");
1143 * Create a sorted list to store element attributes
1145 list
= xmlListCreate(NULL
, (xmlListDataCompare
) xmlC14NAttrsCompare
);
1147 xmlC14NErrInternal("creating attributes list");
1153 /* The processing of an element node E MUST be modified slightly when an XPath node-set is
1154 * given as input and the element's parent is omitted from the node-set. The method for processing
1155 * the attribute axis of an element E in the node-set is enhanced. All element nodes along E's
1156 * ancestor axis are examined for nearest occurrences of attributes in the xml namespace, such
1157 * as xml:lang and xml:space (whether or not they are in the node-set). From this list of attributes,
1158 * remove any that are in E's attribute axis (whether or not they are in the node-set). Then,
1159 * lexicographically merge this attribute list with the nodes of E's attribute axis that are in
1160 * the node-set. The result of visiting the attribute axis is computed by processing the attribute
1161 * nodes in this merged attribute list.
1165 * Add all visible attributes from current node.
1167 attr
= cur
->properties
;
1168 while (attr
!= NULL
) {
1169 /* check that attribute is visible */
1170 if (xmlC14NIsVisible(ctx
, attr
, cur
)) {
1171 xmlListInsert(list
, attr
);
1177 * Handle xml attributes
1179 if (parent_visible
&& (cur
->parent
!= NULL
) &&
1180 (!xmlC14NIsVisible(ctx
, cur
->parent
, cur
->parent
->parent
)))
1185 * If XPath node-set is not specified then the parent is always
1189 while (tmp
!= NULL
) {
1190 attr
= tmp
->properties
;
1191 while (attr
!= NULL
) {
1192 if (xmlC14NIsXmlAttr(attr
) != 0) {
1193 if (xmlListSearch(list
, attr
) == NULL
) {
1194 xmlListInsert(list
, attr
);
1205 case XML_C14N_EXCLUSIVE_1_0
:
1206 /* attributes in the XML namespace, such as xml:lang and xml:space
1207 * are not imported into orphan nodes of the document subset
1211 * Add all visible attributes from current node.
1213 attr
= cur
->properties
;
1214 while (attr
!= NULL
) {
1215 /* check that attribute is visible */
1216 if (xmlC14NIsVisible(ctx
, attr
, cur
)) {
1217 xmlListInsert(list
, attr
);
1222 /* do nothing special for xml attributes */
1225 /* The processing of an element node E MUST be modified slightly when an XPath node-set is
1226 * given as input and some of the element's ancestors are omitted from the node-set.
1228 * Simple inheritable attributes are attributes that have a value that requires at most a simple
1229 * redeclaration. This redeclaration is done by supplying a new value in the child axis. The
1230 * redeclaration of a simple inheritable attribute A contained in one of E's ancestors is done
1231 * by supplying a value to an attribute Ae inside E with the same name. Simple inheritable attributes
1232 * are xml:lang and xml:space.
1234 * The method for processing the attribute axis of an element E in the node-set is hence enhanced.
1235 * All element nodes along E's ancestor axis are examined for the nearest occurrences of simple
1236 * inheritable attributes in the xml namespace, such as xml:lang and xml:space (whether or not they
1237 * are in the node-set). From this list of attributes, any simple inheritable attributes that are
1238 * already in E's attribute axis (whether or not they are in the node-set) are removed. Then,
1239 * lexicographically merge this attribute list with the nodes of E's attribute axis that are in
1240 * the node-set. The result of visiting the attribute axis is computed by processing the attribute
1241 * nodes in this merged attribute list.
1243 * The xml:id attribute is not a simple inheritable attribute and no processing of these attributes is
1246 * The xml:base attribute is not a simple inheritable attribute and requires special processing beyond
1247 * a simple redeclaration.
1249 * Attributes in the XML namespace other than xml:base, xml:id, xml:lang, and xml:space MUST be processed
1250 * as ordinary attributes.
1254 * Add all visible attributes from current node.
1256 attr
= cur
->properties
;
1257 while (attr
!= NULL
) {
1258 /* special processing for XML attributes kicks in only when we have invisible parents */
1259 if ((!parent_visible
) || (xmlC14NIsXmlAttr(attr
) == 0)) {
1260 /* check that attribute is visible */
1261 if (xmlC14NIsVisible(ctx
, attr
, cur
)) {
1262 xmlListInsert(list
, attr
);
1267 /* check for simple inheritance attributes */
1268 if((!matched
) && (xml_lang_attr
== NULL
) && xmlStrEqual(attr
->name
, BAD_CAST
"lang")) {
1269 xml_lang_attr
= attr
;
1272 if((!matched
) && (xml_space_attr
== NULL
) && xmlStrEqual(attr
->name
, BAD_CAST
"space")) {
1273 xml_space_attr
= attr
;
1277 /* check for base attr */
1278 if((!matched
) && (xml_base_attr
== NULL
) && xmlStrEqual(attr
->name
, BAD_CAST
"base")) {
1279 xml_base_attr
= attr
;
1283 /* otherwise, it is a normal attribute, so just check if it is visible */
1284 if((!matched
) && xmlC14NIsVisible(ctx
, attr
, cur
)) {
1285 xmlListInsert(list
, attr
);
1289 /* move to the next one */
1293 /* special processing for XML attributes kicks in only when we have invisible parents */
1294 if ((parent_visible
)) {
1296 /* simple inheritance attributes - copy */
1297 if(xml_lang_attr
== NULL
) {
1298 xml_lang_attr
= xmlC14NFindHiddenParentAttr(ctx
, cur
->parent
, BAD_CAST
"lang", XML_XML_NAMESPACE
);
1300 if(xml_lang_attr
!= NULL
) {
1301 xmlListInsert(list
, xml_lang_attr
);
1303 if(xml_space_attr
== NULL
) {
1304 xml_space_attr
= xmlC14NFindHiddenParentAttr(ctx
, cur
->parent
, BAD_CAST
"space", XML_XML_NAMESPACE
);
1306 if(xml_space_attr
!= NULL
) {
1307 xmlListInsert(list
, xml_space_attr
);
1310 /* base uri attribute - fix up */
1311 if(xml_base_attr
== NULL
) {
1312 /* if we don't have base uri attribute, check if we have a "hidden" one above */
1313 xml_base_attr
= xmlC14NFindHiddenParentAttr(ctx
, cur
->parent
, BAD_CAST
"base", XML_XML_NAMESPACE
);
1315 if(xml_base_attr
!= NULL
) {
1316 xml_base_attr
= xmlC14NFixupBaseAttr(ctx
, xml_base_attr
);
1317 if(xml_base_attr
!= NULL
) {
1318 xmlListInsert(list
, xml_base_attr
);
1320 /* note that we MUST delete returned attr node ourselves! */
1321 xml_base_attr
->next
= attrs_to_delete
;
1322 attrs_to_delete
= xml_base_attr
;
1332 * print out all elements from list
1334 xmlListWalk(list
, (xmlListWalker
) xmlC14NPrintAttrs
, (const void *) ctx
);
1339 xmlFreePropList(attrs_to_delete
);
1340 xmlListDelete(list
);
1345 * xmlC14NCheckForRelativeNamespaces:
1346 * @ctx: the C14N context
1347 * @cur: the current element node
1349 * Checks that current element node has no relative namespaces defined
1351 * Returns 0 if the node has no relative namespaces or -1 otherwise.
1354 xmlC14NCheckForRelativeNamespaces(xmlC14NCtxPtr ctx
, xmlNodePtr cur
)
1358 if ((ctx
== NULL
) || (cur
== NULL
) || (cur
->type
!= XML_ELEMENT_NODE
)) {
1359 xmlC14NErrParam("checking for relative namespaces");
1364 while (ns
!= NULL
) {
1365 if (xmlStrlen(ns
->href
) > 0) {
1368 uri
= xmlParseURI((const char *) ns
->href
);
1370 xmlC14NErrInternal("parsing namespace uri");
1373 if (xmlStrlen((const xmlChar
*) uri
->scheme
) == 0) {
1374 xmlC14NErrRelativeNamespace(uri
->scheme
);
1378 if ((xmlStrcasecmp((const xmlChar
*) uri
->scheme
, BAD_CAST
"urn") != 0)
1379 && (xmlStrcasecmp((const xmlChar
*) uri
->scheme
, BAD_CAST
"dav") !=0)
1380 && (xmlStrlen((const xmlChar
*) uri
->server
) == 0)) {
1381 xmlC14NErrRelativeNamespace(uri
->scheme
);
1393 * xmlC14NProcessElementNode:
1394 * @ctx: the pointer to C14N context object
1395 * @cur: the node to process
1396 * @visible: this node is visible
1397 * @all_parents_visible: whether all the parents of this node are visible
1399 * Canonical XML v 1.0 (http://www.w3.org/TR/xml-c14n)
1402 * If the element is not in the node-set, then the result is obtained
1403 * by processing the namespace axis, then the attribute axis, then
1404 * processing the child nodes of the element that are in the node-set
1405 * (in document order). If the element is in the node-set, then the result
1406 * is an open angle bracket (<), the element QName, the result of
1407 * processing the namespace axis, the result of processing the attribute
1408 * axis, a close angle bracket (>), the result of processing the child
1409 * nodes of the element that are in the node-set (in document order), an
1410 * open angle bracket, a forward slash (/), the element QName, and a close
1413 * Returns non-negative value on success or negative value on fail
1416 xmlC14NProcessElementNode(xmlC14NCtxPtr ctx
, xmlNodePtr cur
, int visible
)
1419 xmlC14NVisibleNsStack state
;
1420 int parent_is_doc
= 0;
1422 if ((ctx
== NULL
) || (cur
== NULL
) || (cur
->type
!= XML_ELEMENT_NODE
)) {
1423 xmlC14NErrParam("processing element node");
1428 * Check relative relative namespaces:
1429 * implementations of XML canonicalization MUST report an operation
1430 * failure on documents containing relative namespace URIs.
1432 if (xmlC14NCheckForRelativeNamespaces(ctx
, cur
) < 0) {
1433 xmlC14NErrInternal("checking for relative namespaces");
1439 * Save ns_rendered stack position
1441 memset(&state
, 0, sizeof(state
));
1442 xmlC14NVisibleNsStackSave(ctx
->ns_rendered
, &state
);
1445 if (ctx
->parent_is_doc
) {
1446 /* save this flag into the stack */
1447 parent_is_doc
= ctx
->parent_is_doc
;
1448 ctx
->parent_is_doc
= 0;
1449 ctx
->pos
= XMLC14N_INSIDE_DOCUMENT_ELEMENT
;
1451 xmlOutputBufferWriteString(ctx
->buf
, "<");
1453 if ((cur
->ns
!= NULL
) && (xmlStrlen(cur
->ns
->prefix
) > 0)) {
1454 xmlOutputBufferWriteString(ctx
->buf
,
1455 (const char *) cur
->ns
->prefix
);
1456 xmlOutputBufferWriteString(ctx
->buf
, ":");
1458 xmlOutputBufferWriteString(ctx
->buf
, (const char *) cur
->name
);
1461 if (!xmlC14NIsExclusive(ctx
)) {
1462 ret
= xmlC14NProcessNamespacesAxis(ctx
, cur
, visible
);
1464 ret
= xmlExcC14NProcessNamespacesAxis(ctx
, cur
, visible
);
1467 xmlC14NErrInternal("processing namespaces axis");
1470 /* todo: shouldn't this go to "visible only"? */
1472 xmlC14NVisibleNsStackShift(ctx
->ns_rendered
);
1475 ret
= xmlC14NProcessAttrsAxis(ctx
, cur
, visible
);
1477 xmlC14NErrInternal("processing attributes axis");
1482 xmlOutputBufferWriteString(ctx
->buf
, ">");
1484 if (cur
->children
!= NULL
) {
1485 ret
= xmlC14NProcessNodeList(ctx
, cur
->children
);
1487 xmlC14NErrInternal("processing childrens list");
1492 xmlOutputBufferWriteString(ctx
->buf
, "</");
1493 if ((cur
->ns
!= NULL
) && (xmlStrlen(cur
->ns
->prefix
) > 0)) {
1494 xmlOutputBufferWriteString(ctx
->buf
,
1495 (const char *) cur
->ns
->prefix
);
1496 xmlOutputBufferWriteString(ctx
->buf
, ":");
1498 xmlOutputBufferWriteString(ctx
->buf
, (const char *) cur
->name
);
1499 xmlOutputBufferWriteString(ctx
->buf
, ">");
1500 if (parent_is_doc
) {
1501 /* restore this flag from the stack for next node */
1502 ctx
->parent_is_doc
= parent_is_doc
;
1503 ctx
->pos
= XMLC14N_AFTER_DOCUMENT_ELEMENT
;
1508 * Restore ns_rendered stack position
1510 xmlC14NVisibleNsStackRestore(ctx
->ns_rendered
, &state
);
1515 * xmlC14NProcessNode:
1516 * @ctx: the pointer to C14N context object
1517 * @cur: the node to process
1519 * Processes the given node
1521 * Returns non-negative value on success or negative value on fail
1524 xmlC14NProcessNode(xmlC14NCtxPtr ctx
, xmlNodePtr cur
)
1529 if ((ctx
== NULL
) || (cur
== NULL
)) {
1530 xmlC14NErrParam("processing node");
1534 visible
= xmlC14NIsVisible(ctx
, cur
, cur
->parent
);
1535 switch (cur
->type
) {
1536 case XML_ELEMENT_NODE
:
1537 ret
= xmlC14NProcessElementNode(ctx
, cur
, visible
);
1539 case XML_CDATA_SECTION_NODE
:
1543 * the string value, except all ampersands are replaced
1544 * by &, all open angle brackets (<) are replaced by <, all closing
1545 * angle brackets (>) are replaced by >, and all #xD characters are
1546 * replaced by 
.
1548 /* cdata sections are processed as text nodes */
1549 /* todo: verify that cdata sections are included in XPath nodes set */
1550 if ((visible
) && (cur
->content
!= NULL
)) {
1553 buffer
= xmlC11NNormalizeText(cur
->content
);
1554 if (buffer
!= NULL
) {
1555 xmlOutputBufferWriteString(ctx
->buf
,
1556 (const char *) buffer
);
1559 xmlC14NErrInternal("normalizing text node");
1566 * Processing Instruction (PI) Nodes-
1567 * The opening PI symbol (<?), the PI target name of the node,
1568 * a leading space and the string value if it is not empty, and
1569 * the closing PI symbol (?>). If the string value is empty,
1570 * then the leading space is not added. Also, a trailing #xA is
1571 * rendered after the closing PI symbol for PI children of the
1572 * root node with a lesser document order than the document
1573 * element, and a leading #xA is rendered before the opening PI
1574 * symbol of PI children of the root node with a greater document
1575 * order than the document element.
1578 if (ctx
->pos
== XMLC14N_AFTER_DOCUMENT_ELEMENT
) {
1579 xmlOutputBufferWriteString(ctx
->buf
, "\x0A<?");
1581 xmlOutputBufferWriteString(ctx
->buf
, "<?");
1584 xmlOutputBufferWriteString(ctx
->buf
,
1585 (const char *) cur
->name
);
1586 if ((cur
->content
!= NULL
) && (*(cur
->content
) != '\0')) {
1589 xmlOutputBufferWriteString(ctx
->buf
, " ");
1591 /* todo: do we need to normalize pi? */
1592 buffer
= xmlC11NNormalizePI(cur
->content
);
1593 if (buffer
!= NULL
) {
1594 xmlOutputBufferWriteString(ctx
->buf
,
1595 (const char *) buffer
);
1598 xmlC14NErrInternal("normalizing pi node");
1603 if (ctx
->pos
== XMLC14N_BEFORE_DOCUMENT_ELEMENT
) {
1604 xmlOutputBufferWriteString(ctx
->buf
, "?>\x0A");
1606 xmlOutputBufferWriteString(ctx
->buf
, "?>");
1610 case XML_COMMENT_NODE
:
1613 * Nothing if generating canonical XML without comments. For
1614 * canonical XML with comments, generate the opening comment
1615 * symbol (<!--), the string value of the node, and the
1616 * closing comment symbol (-->). Also, a trailing #xA is rendered
1617 * after the closing comment symbol for comment children of the
1618 * root node with a lesser document order than the document
1619 * element, and a leading #xA is rendered before the opening
1620 * comment symbol of comment children of the root node with a
1621 * greater document order than the document element. (Comment
1622 * children of the root node represent comments outside of the
1623 * top-level document element and outside of the document type
1626 if (visible
&& ctx
->with_comments
) {
1627 if (ctx
->pos
== XMLC14N_AFTER_DOCUMENT_ELEMENT
) {
1628 xmlOutputBufferWriteString(ctx
->buf
, "\x0A<!--");
1630 xmlOutputBufferWriteString(ctx
->buf
, "<!--");
1633 if (cur
->content
!= NULL
) {
1636 /* todo: do we need to normalize comment? */
1637 buffer
= xmlC11NNormalizeComment(cur
->content
);
1638 if (buffer
!= NULL
) {
1639 xmlOutputBufferWriteString(ctx
->buf
,
1640 (const char *) buffer
);
1643 xmlC14NErrInternal("normalizing comment node");
1648 if (ctx
->pos
== XMLC14N_BEFORE_DOCUMENT_ELEMENT
) {
1649 xmlOutputBufferWriteString(ctx
->buf
, "-->\x0A");
1651 xmlOutputBufferWriteString(ctx
->buf
, "-->");
1655 case XML_DOCUMENT_NODE
:
1656 case XML_DOCUMENT_FRAG_NODE
: /* should be processed as document? */
1657 #ifdef LIBXML_DOCB_ENABLED
1658 case XML_DOCB_DOCUMENT_NODE
: /* should be processed as document? */
1660 #ifdef LIBXML_HTML_ENABLED
1661 case XML_HTML_DOCUMENT_NODE
: /* should be processed as document? */
1663 if (cur
->children
!= NULL
) {
1664 ctx
->pos
= XMLC14N_BEFORE_DOCUMENT_ELEMENT
;
1665 ctx
->parent_is_doc
= 1;
1666 ret
= xmlC14NProcessNodeList(ctx
, cur
->children
);
1670 case XML_ATTRIBUTE_NODE
:
1671 xmlC14NErrInvalidNode("XML_ATTRIBUTE_NODE", "processing node");
1673 case XML_NAMESPACE_DECL
:
1674 xmlC14NErrInvalidNode("XML_NAMESPACE_DECL", "processing node");
1676 case XML_ENTITY_REF_NODE
:
1677 xmlC14NErrInvalidNode("XML_ENTITY_REF_NODE", "processing node");
1679 case XML_ENTITY_NODE
:
1680 xmlC14NErrInvalidNode("XML_ENTITY_NODE", "processing node");
1683 case XML_DOCUMENT_TYPE_NODE
:
1684 case XML_NOTATION_NODE
:
1686 case XML_ELEMENT_DECL
:
1687 case XML_ATTRIBUTE_DECL
:
1688 case XML_ENTITY_DECL
:
1689 #ifdef LIBXML_XINCLUDE_ENABLED
1690 case XML_XINCLUDE_START
:
1691 case XML_XINCLUDE_END
:
1694 * should be ignored according to "W3C Canonical XML"
1698 xmlC14NErrUnknownNode(cur
->type
, "processing node");
1706 * xmlC14NProcessNodeList:
1707 * @ctx: the pointer to C14N context object
1708 * @cur: the node to start from
1710 * Processes all nodes in the row starting from cur.
1712 * Returns non-negative value on success or negative value on fail
1715 xmlC14NProcessNodeList(xmlC14NCtxPtr ctx
, xmlNodePtr cur
)
1720 xmlC14NErrParam("processing node list");
1724 for (ret
= 0; cur
!= NULL
&& ret
>= 0; cur
= cur
->next
) {
1725 ret
= xmlC14NProcessNode(ctx
, cur
);
1733 * @ctx: the pointer to C14N context object
1735 * Cleanups the C14N context object.
1739 xmlC14NFreeCtx(xmlC14NCtxPtr ctx
)
1742 xmlC14NErrParam("freeing context");
1746 if (ctx
->ns_rendered
!= NULL
) {
1747 xmlC14NVisibleNsStackDestroy(ctx
->ns_rendered
);
1754 * @doc: the XML document for canonization
1755 * @is_visible_callback:the function to use to determine is node visible
1757 * @user_data: the first parameter for @is_visible_callback function
1758 * (in most cases, it is nodes set)
1759 * @mode: the c14n mode (see @xmlC14NMode)
1760 * @inclusive_ns_prefixe the list of inclusive namespace prefixes
1761 * ended with a NULL or NULL if there is no
1762 * inclusive namespaces (only for `
1764 * @with_comments: include comments in the result (!=0) or not (==0)
1765 * @buf: the output buffer to store canonical XML; this
1766 * buffer MUST have encoder==NULL because C14N requires
1769 * Creates new C14N context object to store C14N parameters.
1771 * Returns pointer to newly created object (success) or NULL (fail)
1773 static xmlC14NCtxPtr
1774 xmlC14NNewCtx(xmlDocPtr doc
,
1775 xmlC14NIsVisibleCallback is_visible_callback
, void* user_data
,
1776 xmlC14NMode mode
, xmlChar
** inclusive_ns_prefixes
,
1777 int with_comments
, xmlOutputBufferPtr buf
)
1779 xmlC14NCtxPtr ctx
= NULL
;
1781 if ((doc
== NULL
) || (buf
== NULL
)) {
1782 xmlC14NErrParam("creating new context");
1787 * Validate the encoding output buffer encoding
1789 if (buf
->encoder
!= NULL
) {
1790 xmlC14NErr(ctx
, (xmlNodePtr
) doc
, XML_C14N_REQUIRES_UTF8
,
1791 "xmlC14NNewCtx: output buffer encoder != NULL but C14N requires UTF8 output\n");
1796 * Validate the XML document encoding value, if provided.
1798 if (doc
->charset
!= XML_CHAR_ENCODING_UTF8
) {
1799 xmlC14NErr(ctx
, (xmlNodePtr
) doc
, XML_C14N_REQUIRES_UTF8
,
1800 "xmlC14NNewCtx: source document not in UTF8\n");
1805 * Allocate a new xmlC14NCtxPtr and fill the fields.
1807 ctx
= (xmlC14NCtxPtr
) xmlMalloc(sizeof(xmlC14NCtx
));
1809 xmlC14NErrMemory("creating context");
1812 memset(ctx
, 0, sizeof(xmlC14NCtx
));
1815 * initialize C14N context
1818 ctx
->with_comments
= with_comments
;
1819 ctx
->is_visible_callback
= is_visible_callback
;
1820 ctx
->user_data
= user_data
;
1822 ctx
->parent_is_doc
= 1;
1823 ctx
->pos
= XMLC14N_BEFORE_DOCUMENT_ELEMENT
;
1824 ctx
->ns_rendered
= xmlC14NVisibleNsStackCreate();
1826 if(ctx
->ns_rendered
== NULL
) {
1827 xmlC14NErr(ctx
, (xmlNodePtr
) doc
, XML_C14N_CREATE_STACK
,
1828 "xmlC14NNewCtx: xmlC14NVisibleNsStackCreate failed\n");
1829 xmlC14NFreeCtx(ctx
);
1834 * Set "mode" flag and remember list of incluseve prefixes
1835 * for exclusive c14n
1838 if(xmlC14NIsExclusive(ctx
)) {
1839 ctx
->inclusive_ns_prefixes
= inclusive_ns_prefixes
;
1846 * @doc: the XML document for canonization
1847 * @is_visible_callback:the function to use to determine is node visible
1849 * @user_data: the first parameter for @is_visible_callback function
1850 * (in most cases, it is nodes set)
1851 * @mode: the c14n mode (see @xmlC14NMode)
1852 * @inclusive_ns_prefixes: the list of inclusive namespace prefixes
1853 * ended with a NULL or NULL if there is no
1854 * inclusive namespaces (only for exclusive
1855 * canonicalization, ignored otherwise)
1856 * @with_comments: include comments in the result (!=0) or not (==0)
1857 * @buf: the output buffer to store canonical XML; this
1858 * buffer MUST have encoder==NULL because C14N requires
1861 * Dumps the canonized image of given XML document into the provided buffer.
1862 * For details see "Canonical XML" (http://www.w3.org/TR/xml-c14n) or
1863 * "Exclusive XML Canonicalization" (http://www.w3.org/TR/xml-exc-c14n)
1865 * Returns non-negative value on success or a negative value on fail
1868 xmlC14NExecute(xmlDocPtr doc
, xmlC14NIsVisibleCallback is_visible_callback
,
1869 void* user_data
, int mode
, xmlChar
**inclusive_ns_prefixes
,
1870 int with_comments
, xmlOutputBufferPtr buf
) {
1873 xmlC14NMode c14n_mode
= XML_C14N_1_0
;
1876 if ((buf
== NULL
) || (doc
== NULL
)) {
1877 xmlC14NErrParam("executing c14n");
1881 /* for backward compatibility, we have to have "mode" as "int"
1882 and here we check that user gives valid value */
1885 case XML_C14N_EXCLUSIVE_1_0
:
1887 c14n_mode
= (xmlC14NMode
)mode
;
1890 xmlC14NErrParam("invalid mode for executing c14n");
1895 * Validate the encoding output buffer encoding
1897 if (buf
->encoder
!= NULL
) {
1898 xmlC14NErr(NULL
, (xmlNodePtr
) doc
, XML_C14N_REQUIRES_UTF8
,
1899 "xmlC14NExecute: output buffer encoder != NULL but C14N requires UTF8 output\n");
1903 ctx
= xmlC14NNewCtx(doc
, is_visible_callback
, user_data
,
1904 c14n_mode
, inclusive_ns_prefixes
,
1905 with_comments
, buf
);
1907 xmlC14NErr(NULL
, (xmlNodePtr
) doc
, XML_C14N_CREATE_CTXT
,
1908 "xmlC14NExecute: unable to create C14N context\n");
1916 * The root node is the parent of the top-level document element. The
1917 * result of processing each of its child nodes that is in the node-set
1918 * in document order. The root node does not generate a byte order mark,
1919 * XML declaration, nor anything from within the document type
1922 if (doc
->children
!= NULL
) {
1923 ret
= xmlC14NProcessNodeList(ctx
, doc
->children
);
1925 xmlC14NErrInternal("processing docs children list");
1926 xmlC14NFreeCtx(ctx
);
1932 * Flush buffer to get number of bytes written
1934 ret
= xmlOutputBufferFlush(buf
);
1936 xmlC14NErrInternal("flushing output buffer");
1937 xmlC14NFreeCtx(ctx
);
1944 xmlC14NFreeCtx(ctx
);
1950 * @doc: the XML document for canonization
1951 * @nodes: the nodes set to be included in the canonized image
1952 * or NULL if all document nodes should be included
1953 * @mode: the c14n mode (see @xmlC14NMode)
1954 * @inclusive_ns_prefixes: the list of inclusive namespace prefixes
1955 * ended with a NULL or NULL if there is no
1956 * inclusive namespaces (only for exclusive
1957 * canonicalization, ignored otherwise)
1958 * @with_comments: include comments in the result (!=0) or not (==0)
1959 * @buf: the output buffer to store canonical XML; this
1960 * buffer MUST have encoder==NULL because C14N requires
1963 * Dumps the canonized image of given XML document into the provided buffer.
1964 * For details see "Canonical XML" (http://www.w3.org/TR/xml-c14n) or
1965 * "Exclusive XML Canonicalization" (http://www.w3.org/TR/xml-exc-c14n)
1967 * Returns non-negative value on success or a negative value on fail
1970 xmlC14NDocSaveTo(xmlDocPtr doc
, xmlNodeSetPtr nodes
,
1971 int mode
, xmlChar
** inclusive_ns_prefixes
,
1972 int with_comments
, xmlOutputBufferPtr buf
) {
1973 return(xmlC14NExecute(doc
,
1974 (xmlC14NIsVisibleCallback
)xmlC14NIsNodeInNodeset
,
1977 inclusive_ns_prefixes
,
1984 * xmlC14NDocDumpMemory:
1985 * @doc: the XML document for canonization
1986 * @nodes: the nodes set to be included in the canonized image
1987 * or NULL if all document nodes should be included
1988 * @mode: the c14n mode (see @xmlC14NMode)
1989 * @inclusive_ns_prefixes: the list of inclusive namespace prefixes
1990 * ended with a NULL or NULL if there is no
1991 * inclusive namespaces (only for exclusive
1992 * canonicalization, ignored otherwise)
1993 * @with_comments: include comments in the result (!=0) or not (==0)
1994 * @doc_txt_ptr: the memory pointer for allocated canonical XML text;
1995 * the caller of this functions is responsible for calling
1996 * xmlFree() to free allocated memory
1998 * Dumps the canonized image of given XML document into memory.
1999 * For details see "Canonical XML" (http://www.w3.org/TR/xml-c14n) or
2000 * "Exclusive XML Canonicalization" (http://www.w3.org/TR/xml-exc-c14n)
2002 * Returns the number of bytes written on success or a negative value on fail
2005 xmlC14NDocDumpMemory(xmlDocPtr doc
, xmlNodeSetPtr nodes
,
2006 int mode
, xmlChar
** inclusive_ns_prefixes
,
2007 int with_comments
, xmlChar
** doc_txt_ptr
)
2010 xmlOutputBufferPtr buf
;
2012 if (doc_txt_ptr
== NULL
) {
2013 xmlC14NErrParam("dumping doc to memory");
2017 *doc_txt_ptr
= NULL
;
2020 * create memory buffer with UTF8 (default) encoding
2022 buf
= xmlAllocOutputBuffer(NULL
);
2024 xmlC14NErrMemory("creating output buffer");
2029 * canonize document and write to buffer
2031 ret
= xmlC14NDocSaveTo(doc
, nodes
, mode
, inclusive_ns_prefixes
,
2032 with_comments
, buf
);
2034 xmlC14NErrInternal("saving doc to output buffer");
2035 (void) xmlOutputBufferClose(buf
);
2039 ret
= xmlBufUse(buf
->buffer
);
2041 *doc_txt_ptr
= xmlStrndup(xmlBufContent(buf
->buffer
), ret
);
2043 (void) xmlOutputBufferClose(buf
);
2045 if ((*doc_txt_ptr
== NULL
) && (ret
> 0)) {
2046 xmlC14NErrMemory("coping canonicanized document");
2054 * @doc: the XML document for canonization
2055 * @nodes: the nodes set to be included in the canonized image
2056 * or NULL if all document nodes should be included
2057 * @mode: the c14n mode (see @xmlC14NMode)
2058 * @inclusive_ns_prefixes: the list of inclusive namespace prefixes
2059 * ended with a NULL or NULL if there is no
2060 * inclusive namespaces (only for exclusive
2061 * canonicalization, ignored otherwise)
2062 * @with_comments: include comments in the result (!=0) or not (==0)
2063 * @filename: the filename to store canonical XML image
2064 * @compression: the compression level (zlib requred):
2065 * -1 - libxml default,
2067 * >0 - compression level
2069 * Dumps the canonized image of given XML document into the file.
2070 * For details see "Canonical XML" (http://www.w3.org/TR/xml-c14n) or
2071 * "Exclusive XML Canonicalization" (http://www.w3.org/TR/xml-exc-c14n)
2073 * Returns the number of bytes written success or a negative value on fail
2076 xmlC14NDocSave(xmlDocPtr doc
, xmlNodeSetPtr nodes
,
2077 int mode
, xmlChar
** inclusive_ns_prefixes
,
2078 int with_comments
, const char *filename
, int compression
)
2080 xmlOutputBufferPtr buf
;
2083 if (filename
== NULL
) {
2084 xmlC14NErrParam("saving doc");
2088 if (compression
< 0)
2089 compression
= xmlGetCompressMode();
2093 * save the content to a temp buffer, use default UTF8 encoding.
2095 buf
= xmlOutputBufferCreateFilename(filename
, NULL
, compression
);
2097 xmlC14NErrInternal("creating temporary filename");
2102 * canonize document and write to buffer
2104 ret
= xmlC14NDocSaveTo(doc
, nodes
, mode
, inclusive_ns_prefixes
,
2105 with_comments
, buf
);
2107 xmlC14NErrInternal("cannicanize document to buffer");
2108 (void) xmlOutputBufferClose(buf
);
2113 * get the numbers of bytes written
2115 ret
= xmlOutputBufferClose(buf
);
2122 * Macro used to grow the current buffer.
2124 #define growBufferReentrant() { \
2126 buffer = (xmlChar *) \
2127 xmlRealloc(buffer, buffer_size * sizeof(xmlChar)); \
2128 if (buffer == NULL) { \
2129 xmlC14NErrMemory("growing buffer"); \
2135 * xmlC11NNormalizeString:
2136 * @input: the input string
2137 * @mode: the normalization mode (attribute, comment, PI or text)
2139 * Converts a string to a canonical (normalized) format. The code is stolen
2140 * from xmlEncodeEntitiesReentrant(). Added normalization of \x09, \x0a, \x0A
2141 * and the @mode parameter
2143 * Returns a normalized string (caller is responsible for calling xmlFree())
2144 * or NULL if an error occurs
2147 xmlC11NNormalizeString(const xmlChar
* input
,
2148 xmlC14NNormalizationMode mode
)
2150 const xmlChar
*cur
= input
;
2151 xmlChar
*buffer
= NULL
;
2152 xmlChar
*out
= NULL
;
2153 int buffer_size
= 0;
2159 * allocate an translation buffer.
2162 buffer
= (xmlChar
*) xmlMallocAtomic(buffer_size
* sizeof(xmlChar
));
2163 if (buffer
== NULL
) {
2164 xmlC14NErrMemory("allocating buffer");
2169 while (*cur
!= '\0') {
2170 if ((out
- buffer
) > (buffer_size
- 10)) {
2171 int indx
= out
- buffer
;
2173 growBufferReentrant();
2174 out
= &buffer
[indx
];
2177 if ((*cur
== '<') && ((mode
== XMLC14N_NORMALIZE_ATTR
) ||
2178 (mode
== XMLC14N_NORMALIZE_TEXT
))) {
2183 } else if ((*cur
== '>') && (mode
== XMLC14N_NORMALIZE_TEXT
)) {
2188 } else if ((*cur
== '&') && ((mode
== XMLC14N_NORMALIZE_ATTR
) ||
2189 (mode
== XMLC14N_NORMALIZE_TEXT
))) {
2195 } else if ((*cur
== '"') && (mode
== XMLC14N_NORMALIZE_ATTR
)) {
2202 } else if ((*cur
== '\x09') && (mode
== XMLC14N_NORMALIZE_ATTR
)) {
2208 } else if ((*cur
== '\x0A') && (mode
== XMLC14N_NORMALIZE_ATTR
)) {
2214 } else if ((*cur
== '\x0D') && ((mode
== XMLC14N_NORMALIZE_ATTR
) ||
2215 (mode
== XMLC14N_NORMALIZE_TEXT
) ||
2216 (mode
== XMLC14N_NORMALIZE_COMMENT
) ||
2217 (mode
== XMLC14N_NORMALIZE_PI
))) {
2225 * Works because on UTF-8, all extended sequences cannot
2226 * result in bytes in the ASCII range.
2235 #endif /* LIBXML_OUTPUT_ENABLED */
2237 #include "elfgcchack.h"
2238 #endif /* LIBXML_C14N_ENABLED */