use LWP::Simple qw(!head);
use LWP::UserAgent;
use HTML::LinkExtor;
use URI::URL;
# HTTP client with a 3-second timeout, plus the parser that records links.
my $ua = LWP::UserAgent->new(timeout => 3);
my $p  = HTML::LinkExtor->new;

# Request $url; the content callback passes each chunk of the response body
# (its first argument) straight to the link parser.
my $page_request = HTTP::Request->new(GET => $url);
my $res = $ua->request($page_request, sub { $p->parse($_[0]) });
##################
# Collect the link URLs from the parser's list of anonymous arrays
##################
# Queue element [2] of every link record the parser collected, skipping
# records where that element is undefined. Order of the records is kept.
push @search, grep { defined } map { $_->[2] } $p->links;
#################
# Take known URL-types and rebuild them
#################
# Turn one raw link into the form stored in @search_ready.
#
#   $link - link text as extracted from the page (must be defined)
#   $base - prefix prepended to links that carry no "scheme://" of their own
#
# Returns the rebuilt link, or nothing (undef in scalar context) when the
# link is to be dropped.
sub _rebuild_link {
    my ($link, $base) = @_;

    # Fragment-only links ("#section") are dropped.
    return if $link =~ /^#/;

    # A link with its own "scheme://" is already absolute and is kept as is.
    # Testing for "http://" alone glued $base in front of https:// and
    # ftp:// links.
    return $link if $link =~ m{^[a-z][a-z0-9+.\-]*://}i;

    # Mail links are dropped.
    return if $link =~ /mailto:/i;

    # NOTE(review): other scheme-only links (e.g. "javascript:") still get
    # $base prepended, as before -- confirm whether they should be dropped.
    return "$base$link";
}

# Rebuild every collected link and queue the ones that survive.
for my $link (@search) {
    my $ready = _rebuild_link($link, $base);
    #print "$ready\n";
    push(@search_ready, $ready) if defined $ready;
}