use strict;
use warnings;
use HTML::Parser ();

# Scan an HTML file for <a> tags whose href mentions a "CIS Report for
# DD/DD/DDDD" entry and print one "<date>: <pdf>" line per matching link.
#
# Usage: script.pl [html_file]
# The file to parse may be given as the first command-line argument; when it
# is omitted the original hard-coded location is used.
my $html_file = @ARGV ? $ARGV[0] : 'c:/data/perl/script/volvo.html';

# Create parser object. Only start tags are handled; the handler is called
# with the tag name and a hash reference holding the tag's attributes.
my $p = HTML::Parser->new(
    api_version => 3,
    start_h     => [ \&a_tag, "tag, attr" ],
);

# parse_file() returns undef (with the reason in $!) when the file cannot be
# opened, so fail loudly instead of silently printing nothing.
defined $p->parse_file($html_file)
    or die "Cannot parse '$html_file': $!\n";

# Start-tag handler registered with the parser above.
#
# Arguments:
#   $tag  - name of the start tag being reported
#   $attr - hash reference of that tag's attributes
#
# Prints "<date>: <file>\n" for every <a> tag whose href contains
# 'CIS Report for <date>; <file> is the text captured after "PopupInfo('"
# up to the last "pdf" in the href (empty when that part is absent).
# Returns nothing useful; non-matching tags are ignored.
sub a_tag {
    my ($tag, $attr) = @_;
    return unless $tag eq 'a';

    # Anchors such as <a name="..."> carry no href at all; skip them rather
    # than matching against undef.
    my $href = $attr->{'href'};
    return unless defined $href;

    return unless $href =~ m|'CIS Report for (\d{2}/\d{2}/\d{4})|;
    my $date = $1;

    # List-context match: $file stays undef when the pattern does not match.
    my ($file) = $href =~ m|PopupInfo\('(.*pdf)|;
    $file = '' unless defined $file;    # keep the output line, avoid undef interpolation

    print "$date: $file\n";
    return;
}