use XML::LibXML;

# Extract all <h1> elements from the HTML markup held in $html.
# NOTE(review): $html is not set in this snippet; it is expected to be
# provided by surrounding code.

# Parser configured with recover => 2, which (per the XML::LibXML parser
# options) lets libxml2 continue past malformed markup without emitting
# warnings for the errors it recovers from.
my $parser = XML::LibXML->new(
    recover => 2,
);

# Parse the string as HTML rather than XML and obtain the document tree.
my $xmltree = $parser->parse_html_string(
    $html
);

# List-context call: @nodes receives the matching 'h1' element nodes.
my @nodes = $xmltree->getElementsByTagName(
    'h1'
);