in reply to Help with web crawling
use strict;
use warnings;

use HTML::HTML5::Parser;

# Filing index page to fetch.
my $uri = 'http://www.sec.gov/Archives/edgar/data/935226/'
        . '000114420411058092/0001144204-11-058092-index.htm';

# Select the class="info" children of every class="formGrouping" element
# that also has a class="infoHead" child whose text contains "Items".
# The element name is left as "*" so the match does not depend on tag
# names or on the namespace the parser assigns to elements.
my $xpath = '//*[@class="formGrouping" and '
          . './*[@class="infoHead" and contains(./text(), "Items")]]'
          . '/*[@class="info"]';

# Download and parse the page into a DOM document.
my $document = HTML::HTML5::Parser->load_html(location => $uri);

# findvalue() evaluates the XPath expression and returns the result as a
# string.
my $item = $document->findvalue($xpath);

print $item, "\n";
|
|---|