2 package IkiWiki::Plugin::htmlbalance;
4 # htmlbalance: Parse and re-serialize HTML to ensure balanced tags
6 # Copyright 2008 Simon McVittie <http://smcv.pseudorandom.co.uk/>
7 # Licensed under the GNU GPL, version 2, or any later version published by the
8 # Free Software Foundation
13 use HTML::TreeBuilder;
17 hook(type => "getsetup", id => "htmlbalance", call => \&getsetup);
18 hook(type => "sanitize", id => "htmlbalance", call => \&sanitize);
21 sub getsetup () { #{{{
29 sub sanitize (@) { #{{{
33 my $tree = HTML::TreeBuilder->new();
34 $tree->ignore_unknown(0);
35 $tree->ignore_ignorable_whitespace(0);
36 $tree->no_space_compacting(1);
38 $tree->store_comments(0);
39 $tree->store_declarations(0);
41 $tree->parse_content($params{content});
42 my @nodes = $tree->disembowel();
43 foreach my $node (@nodes) {
45 $ret .= $node->as_XML();
50 $ret .= encode_entities($node);