Do not escape double quotes inside raw_text elements
This is not necessary and breaks tokenization compatibility.
Change-Id: Ib43733cf7264ee07b010a3478e8c4b728f7bd708
diff --git a/t/tei.t b/t/tei.t
index 94f7577..69b4ee1 100644
--- a/t/tei.t
+++ b/t/tei.t
@@ -9,7 +9,7 @@
use Test::KorAP::XML::TEI qw!korap_tempfile test_tei2korapxml!;
-use_ok('KorAP::XML::TEI', 'remove_xml_comments', 'escape_xml');
+use_ok('KorAP::XML::TEI', 'remove_xml_comments', 'escape_xml', 'escape_xml_minimal');
subtest 'remove_xml_comments' => sub {
my ($fh, $filename) = korap_tempfile('tei');
@@ -87,5 +87,31 @@
);
};
+subtest 'escape_xml_minimal' => sub { # minimal escaping: markup characters only, never double quotes
+  is( # double quotes stay literal (the point of this change, per the commit message)
+    escape_xml_minimal('"""'),
+    '"""'
+  );
+
+  is( # ampersands are expected to become entity references
+    escape_xml_minimal('&&&'),
+    '&amp;&amp;&amp;'
+  );
+
+  is( # opening angle brackets are expected to be escaped
+    escape_xml_minimal('<<<'),
+    '&lt;&lt;&lt;'
+  );
+
+  is( # closing angle brackets are expected to be escaped as well
+    escape_xml_minimal('>>>'),
+    '&gt;&gt;&gt;'
+  );
+
+  is( # mixed input: markup characters escaped, attribute quotes left as-is
+    escape_xml_minimal('<tag att1="foo" att2="bar">C&A</tag>'),
+    '&lt;tag att1="foo" att2="bar"&gt;C&amp;A&lt;/tag&gt;'
+  );
+};
done_testing;