From c3e6b7e4672eb2eb44262f0ccb7025ea53b0dce4 Mon Sep 17 00:00:00 2001 From: Trey Evans Date: Sun, 3 Apr 2022 10:59:23 -0400 Subject: [PATCH] Correct C implementation issues for #2494. --- ext/nokogiri/xml_node.c | 29 ++++++++++++++++++++++++----- test/xml/test_namespace.rb | 22 ++++++++++++++++++++++ 2 files changed, 46 insertions(+), 5 deletions(-) diff --git a/ext/nokogiri/xml_node.c b/ext/nokogiri/xml_node.c index 1728c4d4156..8cba0ddd8f9 100644 --- a/ext/nokogiri/xml_node.c +++ b/ext/nokogiri/xml_node.c @@ -64,10 +64,16 @@ static const rb_data_type_t nokogiri_node_type = { }; static void -relink_namespace(xmlNodePtr reparented) +relink_namespace(xmlNodePtr reparented, int reconcile_namespaces) { xmlNodePtr child; xmlAttrPtr attr; + xmlNsPtr possible_collision_ns; + int ns_collision; + + if (reconcile_namespaces && reparented->doc) { + xmlReconciliateNs(reparented->doc, reparented); + } if (reparented->type != XML_ATTRIBUTE_NODE && reparented->type != XML_ELEMENT_NODE) { return; } @@ -118,9 +124,16 @@ relink_namespace(xmlNodePtr reparented) reparented->parent, curr->href ); + /* Track and check for a namespace which might be 'squatting' on a + * the same prefix but a different href. */ + ns_collision = 0; + possible_collision_ns = xmlSearchNs(reparented->doc, reparented->parent, curr->prefix); + if (possible_collision_ns && !xmlStrEqual(curr->href, possible_collision_ns->href)) { + ns_collision = 1; + } /* If we find the namespace is already declared, remove it from this * definition list. */ - if (ns && ns != curr && xmlStrEqual(ns->prefix, curr->prefix)) { + if (ns && ns != curr && !ns_collision && xmlStrEqual(ns->prefix, curr->prefix)) { if (prev) { prev->next = curr->next; } else { @@ -161,14 +174,14 @@ relink_namespace(xmlNodePtr reparented) /* their namespaces are reparented as well. */ child = reparented->children; while (NULL != child) { - relink_namespace(child); + relink_namespace(child, 0); child = child->next; } if (reparented->type == XML_ELEMENT_NODE) { attr = reparented->properties; while (NULL != attr) { - relink_namespace((xmlNodePtr)attr); + relink_namespace((xmlNodePtr)attr, 0); attr = attr->next; } } @@ -218,6 +231,7 @@ reparent_node_with(VALUE pivot_obj, VALUE reparentee_obj, pivot_reparentee_func { VALUE reparented_obj ; xmlNodePtr reparentee, original_reparentee, pivot, reparented, next_text, new_next_text, parent ; + int reconcile_ns = 1; int original_ns_prefix_is_default = 0 ; if (!rb_obj_is_kind_of(reparentee_obj, cNokogiriXmlNode)) { @@ -227,6 +241,11 @@ reparent_node_with(VALUE pivot_obj, VALUE reparentee_obj, pivot_reparentee_func rb_raise(rb_eArgError, "node must be a Nokogiri::XML::Node"); } + // Don't reconcile children of fragments. + if (rb_obj_is_kind_of(pivot_obj, cNokogiriXmlDocumentFragment)) { + reconcile_ns = 0; + } + Noko_Node_Get_Struct(reparentee_obj, xmlNode, reparentee); Noko_Node_Get_Struct(pivot_obj, xmlNode, pivot); @@ -408,7 +427,7 @@ reparent_node_with(VALUE pivot_obj, VALUE reparentee_obj, pivot_reparentee_func /* if we've created a cycle, raise an exception */ raise_if_ancestor_of_self(reparented); - relink_namespace(reparented); + relink_namespace(reparented, reconcile_ns); return reparented_obj ; } diff --git a/test/xml/test_namespace.rb b/test/xml/test_namespace.rb index 74ee6d100a5..4f3d5ae5937 100644 --- a/test/xml/test_namespace.rb +++ b/test/xml/test_namespace.rb @@ -93,6 +93,28 @@ def test_maintain_element_namespaces_in_urn assert_equal("urn:xmpp:foospec:barfoo", child.namespace.href) assert_empty(child.attributes) end + + def test_maintain_element_namespaces_with_abbreviation_squating + root_namespace_href = "urn:root_namespace" + child1_namespace_href = "urn:child1_namespace" + doc = Nokogiri::XML(<<-eoxml) + + + + + eoxml + + child2 = doc.at_xpath("//ns1:child2", { "ns1" => root_namespace_href }) + child1 = doc.at_xpath("//ns2:child1", { "ns2" => child1_namespace_href }) + child1.add_child(child2) + new_xml = doc.to_xml + + new_doc = Nokogiri::XML(new_xml) + new_child1 = new_doc.at_xpath("//ns2:child1", { "ns2" => child1_namespace_href }) + new_child2 = new_child1.first_element_child + new_child2_ns_href = new_child2.namespace.href + assert_equal(root_namespace_href, new_child2_ns_href) + end end end end