# Print every text node longer than a minimum length from an HTML page.
#
# The page is parsed in recovery mode so that malformed, real-world HTML
# still yields a document tree that can be queried with XPath.
use strict;
use warnings;
use XML::LibXML;

my $url        = "http://www.example.com/some/url";
my $min_length = 100;    # a text node must be longer than this (in characters)

my $parser = XML::LibXML->new;

# Recover from markup errors without reporting them.  This replaces the
# previous approach of localizing STDOUT/STDERR and reopening them on
# /dev/null, which relied on unchecked two-argument opens of global handles.
$parser->recover_silently(1);

my $doc = $parser->parse_html_file($url)
    or die "Could not parse HTML from $url\n";

# toString emits the serialized (entity-escaped) form of each text node;
# no separator is printed between nodes.
for my $node ($doc->findnodes(qq{//text()[string-length() > $min_length]})) {
    print $node->toString;
}
In reply to Locate large HTML paragraphs with XML::LibXML by merlyn
| For: | Use: |
|------|------|
| & | `&amp;` |
| < | `&lt;` |
| > | `&gt;` |
| [ | `&#91;` |
| ] | `&#93;` |