use strict;
use warnings;
use HTML::TokeParser::Simple;

# Scan a local HTML file and print "PDF link!" once for every <a> start tag
# whose href points at a PDF document.

my $filepath = "c:/folder/file.html";

# The constructor returns a false value when the file cannot be opened;
# name the file in the message so the failure is actionable.
my $stream = HTML::TokeParser::Simple->new($filepath)
    or die "Cannot open '$filepath': $!";

TOKEN:
while (my $token = $stream->get_token) {
    next TOKEN unless $token->is_start_tag('a');

    # Anchors without an href (e.g. <a name="top">) yield undef here;
    # skip them instead of running a regex match against undef.
    my $href = $token->get_attr('href');
    next TOKEN unless defined $href;

    # Require ".pdf" to end the path: it must be followed by the end of the
    # string, a query string, or a fragment. This rejects "notes.pdf.html"
    # while /i still accepts "REPORT.PDF".
    print "PDF link!\n" if $href =~ m{ \.pdf (?= [?\#] | \z ) }xi;
}