# Parse the HTML sample stored after __END__, report the type of its first
# token, then print the text that follows that token.
use strict;
use warnings;

use HTML::TokeParser;

# Decode the sample on input and encode on output, so the parser works on
# characters rather than raw bytes and any non-ASCII text prints without
# "Wide character" warnings.
# NOTE(review): assumes this file is saved as UTF-8 -- confirm.
binmode DATA,   ':encoding(UTF-8)';
binmode STDOUT, ':encoding(UTF-8)';

# Slurp the whole DATA section; $/ is undefined only inside the do block.
my $lines = do { local $/; <DATA> };
$lines = '' unless defined $lines;

my $tok_par = HTML::TokeParser->new(\$lines)
    or die "Cannot create HTML::TokeParser: $!\n";

# get_token yields an array reference whose first element is the token type;
# it yields undef when the document has no tokens, so guard the dereference.
my $tok_inf = $tok_par->get_token;
my $tok_typ = defined $tok_inf ? shift @{$tok_inf} : '';
print "Type: $tok_typ \n";

# Text up to the next tag; fall back to an empty string when there is none.
my $title = $tok_par->get_text() || "";
print "Title: $title \n";

__END__
egrave: è : eacute: é : rsquo: ’ : lsquo: ‘