diff --git a/patches/libxml2/0012-parser-Fix-crash-in-xmlParseInNodeContext-with-HTML.patch b/patches/libxml2/0012-parser-Fix-crash-in-xmlParseInNodeContext-with-HTML.patch
new file mode 100644
index 0000000000..56e8851784
--- /dev/null
+++ b/patches/libxml2/0012-parser-Fix-crash-in-xmlParseInNodeContext-with-HTML.patch
@@ -0,0 +1,33 @@
+From 95f2a17440568694a6df6a326c5b411e77597be2 Mon Sep 17 00:00:00 2001
+From: Nick Wellnhofer
+Date: Tue, 30 Jan 2024 13:25:17 +0100
+Subject: [PATCH] parser: Fix crash in xmlParseInNodeContext with HTML
+ documents
+
+Ignore namespaces if we have an HTML document with namespaces added
+manually.
+
+Fixes #672.
+---
+ parser.c | 4 +++-
+ 1 file changed, 3 insertions(+), 1 deletion(-)
+
+diff --git a/parser.c b/parser.c
+index 1038d71b..f7842ed1 100644
+--- a/parser.c
++++ b/parser.c
+@@ -12415,8 +12415,10 @@ xmlParseInNodeContext(xmlNodePtr node, const char *data, int datalen,
+     }
+     xmlAddChild(node, fake);
+ 
+-    if (node->type == XML_ELEMENT_NODE) {
++    if (node->type == XML_ELEMENT_NODE)
+         nodePush(ctxt, node);
++
++    if ((ctxt->html == 0) && (node->type == XML_ELEMENT_NODE)) {
+         /*
+          * initialize the SAX2 namespaces stack
+          */
+-- 
+2.42.0
+
diff --git a/test/html5/test_api.rb b/test/html5/test_api.rb
index 403287c7ee..0ff5957a34 100644
--- a/test/html5/test_api.rb
+++ b/test/html5/test_api.rb
@@ -238,6 +238,18 @@ def test_node_wrap_uses_parent_node_as_parsing_context_node
     assert_equal("select", el.parent.parent.name)
   end
 
+  def test_parse_in_context_of_foreign_namespace
+    # https://github.com/sparklemotion/nokogiri/issues/3112
+    # https://gitlab.gnome.org/GNOME/libxml2/-/issues/672
+    doc = Nokogiri::HTML5::Document.parse("<html><body><math></math></body></html>") # <math> is a foreign (MathML) element
+    math = doc.at_css("math")
+
+    nodes = math.parse("mrow") # segfaults in libxml 2.12 before 95f2a174
+
+    assert_kind_of(Nokogiri::XML::NodeSet, nodes)
+    assert_equal(1, nodes.length)
+  end
+
   describe Nokogiri::HTML5::Document do
     describe "#fragment" do
       it "parses text nodes in a `body` context" do