Discount in current Debian unstable turns the IURI href into a URI
by encoding the Unicode as UTF-8 and %-escaping each byte.
That is valid, and matches Wikipedia's expectations, but was breaking
this test for me.
It would also be entirely valid (and lead to equivalent parsing) if the
ö was represented as ö, ö or ö in the text and/or the href.
subtest 'Text::Textile apparently double-escapes HTML entities in hrefs' => sub {
my $text = q{Gödel, Escher, Bach};
subtest 'Text::Textile apparently double-escapes HTML entities in hrefs' => sub {
my $text = q{Gödel, Escher, Bach};
+ my $text_ok = qr{G(?:ö|ö|ö|&#x[fF]6;)del, Escher, Bach};
my $href = q{https://en.wikipedia.org/wiki/Gödel,_Escher,_Bach};
my $href = q{https://en.wikipedia.org/wiki/Gödel,_Escher,_Bach};
- my $good = qq{<p><a href="$href">$text</a></p>};
+ my $href_ok = qr{https://en\.wikipedia\.org/wiki/G(?:ö|ö|ö|&#x[fF]6|%[cC]3%[bB]6)del,_Escher,_Bach};
+ my $good = qr{<p><a href="$href_ok">$text_ok</a></p>};
chomp(my $mdwn_html = IkiWiki::Plugin::mdwn::htmlize(
content => qq{[$text]($href)},
));
chomp(my $mdwn_html = IkiWiki::Plugin::mdwn::htmlize(
content => qq{[$text]($href)},
));
+ like($mdwn_html, $good);
chomp(my $txtl_html = IkiWiki::Plugin::textile::htmlize(
content => qq{"$text":$href},
));
TODO: {
local $TODO = "Text::Textile double-escapes the href";
chomp(my $txtl_html = IkiWiki::Plugin::textile::htmlize(
content => qq{"$text":$href},
));
TODO: {
local $TODO = "Text::Textile double-escapes the href";
- is($txtl_html, $good);
- isnt($txtl_html, q{<p><a href="https://en.wikipedia.org/wiki/G&ouml;del,_Escher,_Bach">Gödel, Escher, Bach</a></p>});
+ like($txtl_html, $good);
+ unlike($txtl_html, qr{<p><a href="https://en\.wikipedia\.org/wiki/G&ouml;del,_Escher,_Bach">Gödel, Escher, Bach</a></p>}i);