Help for this page
# Snippet: load HTML::TokeParser at runtime, construct a parser for
# "output.xml" into $p, then open "output.xml" on the bareword handle FH,
# print $p to that handle, and close it.
#
# NOTE(review): the "|| ..." after the constructor looks like elided error
# handling from the original example rather than real code -- as written the
# statement is unlikely to compile. TODO: fill in the intended handling
# (e.g. `or die ...`) once it is known.
# NOTE(review): open(FH, "output.xml") is the two-argument form with no mode,
# which opens the file for reading, so the following `print FH $p` targets a
# handle that is not open for output. The results of open/print/close are
# also not checked.
# NOTE(review): $p holds the parser object itself, so `print FH $p` would emit
# the stringified reference, not parsed content -- confirm what output was
# actually intended before changing this.
require HTML::TokeParser; $p = HTML::TokeParser->new("output.xml") || ... open(FH, "output.xml"); print FH $p; close FH;
<greeting class="simple">Hello, world!