#!/usr/bin/perl --
# Demonstrates HTML::Parser (API version 3) running in xml_mode: one default
# handler receives every parser event and prints its event name, tag and
# source text, one event per output line.
use strict;
use warnings;
use HTML::Parser;

my $p = HTML::Parser->new(
    api_version => 3,

    # Catch-all handler for every event type. The argspec asks for the event
    # name, the tag (end tags carry a leading "/") and the raw source text.
    # Undefined arguments (e.g. the tag of a text event) are dropped by grep.
    # The newline is deliberately left inside the joined list, so every
    # output line ends in " | " - this matches the recorded output below.
    default_h => [
        sub { print join( ' | ', grep { defined $_ } @_, "\n" ) },
        "event,tag,text,",
    ],

    # strict_names => 1,
    xml_mode => 1,    # recorded output shows tag-name case kept (Moo, COW, /BOO)
);

# NOTE(review): the markup in this document had been stripped from the copy of
# the script under review. It is reconstructed here from the event sequence
# recorded after __END__; the exact whitespace between tags is a best guess -
# confirm against the original if it matters.
my $html = join q{ },
    '<boo><foo><shoo><Moo><COW></BOO>',
    '<html><body> hi <br>',
    '<a>hello</a>',
    '<boo><foo><shoo><Moo><COW></BOO>',
    '</body></html>';

$p->parse($html);

# Signal end of input so that any buffered text is flushed and the
# end_document event is delivered.
$p->eof;

__END__
Recorded output, one event per line (columns: event | tag | source text).
The final end_document line was not part of the original recording; it is
the expected result of the added $p->eof call - TODO confirm by re-running.

start_document |  |
start | boo | <boo> |
start | foo | <foo> |
start | shoo | <shoo> |
start | Moo | <Moo> |
start | COW | <COW> |
end | /BOO | </BOO> |
text |   |
start | html | <html> |
start | body | <body> |
text |  hi  |
start | br | <br> |
text |   |
start | a | <a> |
text | hello |
end | /a | </a> |
text |   |
start | boo | <boo> |
start | foo | <foo> |
start | shoo | <shoo> |
start | Moo | <Moo> |
start | COW | <COW> |
end | /BOO | </BOO> |
text |   |
end | /body | </body> |
end | /html | </html> |
end_document |  |