use strict;
use warnings;
use HTML::TokeParser;

# Scan one HTML file and print "PDF link!" once for every start tag whose
# href attribute contains the substring ".pdf".
my $filepath = "c:/folder/file.html";

# The constructor returns undef (with the reason in $!) when the file cannot
# be opened, so fail here with a clear message instead of crashing later on a
# method call against an undefined value.
my $stream = HTML::TokeParser->new($filepath)
    or die "Can't open $filepath: $!";

TOKEN:
while (my $token = $stream->get_token()) {
    # Only start-tag tokens ("S") keep an attribute hash ref in slot 2. For
    # other token types that slot holds plain text or nothing at all, and
    # dereferencing it as a hash is fatal under strict refs.
    next TOKEN unless $token->[0] eq 'S';

    # Plenty of start tags have no href; skip them rather than matching
    # against an undefined value.
    my $href = $token->[2]{'href'};
    next TOKEN unless defined $href;

    # Unanchored, case-sensitive substring match, kept as originally written.
    print "PDF link!\n" if $href =~ m/\.pdf/;
}