comment on

Here is my code.

The TODO part is where I have to put my code. But everything I read for XML::RSS::LibXML doesn't let me pull out "item" tag.

#!/usr/bin/perl
use File::Path; use Data::Dumper;
use LWP::UserAgent;
use XML::RSS::LibXML;
use POSIX qw(strftime);
use Time::HiRes qw(gettimeofday tv_interval);
my $client = LWP::UserAgent->new();
my ($fh, $feed, $feed_title, $count, $node);
my $rss = XML::RSS::LibXML->new;
my $website_name = "usnews";
my $url = "http://www.usnews.com/rss/health-news/index.rss";

$firstListing = 1;
while (1)
{
    if ( $website_name eq "" )
    { next; };

    print "polling: $website_name url: $url\n";
    $capture = $client->get("$url", ":content_file" => "/tmp/.rss_down
+load_file") || die"$!\n";
    $rss->parsefile('/tmp/.rss_download_file');

    print "channel: $rss->{channel}->{title}\n";
    @curListOfItems = ();
    foreach my $item (@{ $rss->{items} })
    {
        my $node_link = $item->{link};

        if (defined $node_link)
        {
            $curItem=$node_link ."\n";
            push (@curListOfItems, $curItem);
        }
    }
    if ($#prevListOfItems != -1 )
    {
        # @newlyAddedLinks will be latest in curListOfItems and not in
+ @prevListOfItems
        @newlyAddedLinks=grep!${{map{$_,1}@prevListOfItems}}{$_},@curL
+istOfItems;

        foreach my $l (@newlyAddedLinks)
        {
            my $fileName=getFileName();
            $fileName="/tmp/.$website_name\_${fileName}";
            my $capture = $client->get("$l", ":content_file" => "$file
+Name");
            # TODO: Pull out the current Item tag ( <item> .....</item
+> )
        }
        print "Getting1 $filename\n";
    }
    elsif ( $firstListing == 1)
    {
        print "Getting2 $filename\n";
        foreach my $l (@curListOfItems)
        {
            my $fileName=getFileName();
            $fileName="/tmp/.$website_name\_${fileName}";
            my $capture = $client->get("$l", ":content_file" => "$file
+Name");
            # TODO: Pull out the current Item tag ( <item> .....</item
+> )
        }
        $firstListing = 0;
    }
    @prevListOfItems = @curListOfItems;
    open OUT_FILE, "> /tmp/.$website_name" || die "could not open file
+ $!";
    print OUT_FILE "@prevListOfItems";
    close OUT_FILE;

    sleep 1;
}
sub getFileName
{
    my ($seconds, $microseconds) = gettimeofday();
    my $padded_usecs = sprintf ('%06d', $microseconds);
    my ($logType, $str1, $str2) = split ('\|',$LogElement);
    $todaysDate = strftime "%d", localtime;
    $currentDateTime = strftime "%Y:%m:%d:%H:%M:%S", localtime;
    ($Year,$Month,$Date,$Hour,$Minute,$Seconds) = split /:/, $currentD
+ateTime;
    $curYear = sprintf ('%04d', $Year);
    $curMonth = sprintf ('%02d', $Month);
    $curHour = sprintf ('%02d', $Hour);
    $curMinute = sprintf ('%02d', $Minute);
    $curDate = sprintf ('%02d', $Date);
    $curSec = sprintf ('%02d', $Seconds);
    my $fname = "${curYear}${curMonth}${curMonth}${curHour}${curMinute
+}${curSec}.html";
    return "$fname";

}
[download]

In reply to Re^2: Parsing ITEM Tag from RSS feed using XML::RSS::LibXML by mr_p
in thread Parsing ITEM Tag from RSS feed using XML::RSS::LibXML by mr_p

Posts are HTML formatted. Put <p> </p> tags around your paragraphs. Put <code> </code> tags around your code and data!

Titles consisting of a single word are discouraged, and in most cases are disallowed outright.

Read Where should I post X? if you're not absolutely sure you're posting in the right place.

Please read these before you post! —

Posts may use any of the Perl Monks Approved HTML tags:

a, abbr, b, big, blockquote, br, caption, center, col, colgroup, dd, del, details, div, dl, dt, em, font, h1, h2, h3, h4, h5, h6, hr, i, ins, li, ol, p, pre, readmore, small, span, spoiler, strike, strong, sub, summary, sup, table, tbody, td, tfoot, th, thead, tr, tt, u, ul, wbr

You may need to use entities for some characters, as follows. (Exception: Within code tags, you can put the characters literally.)

	For:		Use:
	&		`&`
	<		`<`
	>		`>`
	[		`[`
	]		`]`

Link using PerlMonks shortcuts! What shortcuts can I use for linking?

See Writeup Formatting Tips and other pages linked from there for more info.