From 34c869ca5b9ab72900869dc25d056cc496acef2b Mon Sep 17 00:00:00 2001 From: Daniel Heath Date: Tue, 29 Oct 2024 11:15:12 +1100 Subject: [PATCH] Valid HTML may contain unescaped `>` characters in text nodes --- lib/upmark/parser/xml.rb | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/lib/upmark/parser/xml.rb b/lib/upmark/parser/xml.rb index 01e8ce5..4fb130e 100644 --- a/lib/upmark/parser/xml.rb +++ b/lib/upmark/parser/xml.rb @@ -36,7 +36,7 @@ class XML < Parslet::Parser rule(:text) do match(/\A[\s\n\t ]+\Z/m).absent? >> # ignore entirely empty strings - match(/[^<>]/).repeat(1) + match(/[^<]/).repeat(1) end rule(:start_tag) do