#!/usr/bin/perl -w
use strict;
use HTML::TokeParser;
use LWP::Simple;
use URI;
# CGI entry point: fetch the Reuters "earlier articles" business page and
# print the absolute URL of every link that immediately follows a
# <td class="earlyHeadline"> start tag, one URL per line.
print "Content-type: text/html\n\n";

my $base_url = 'http://www.reuters.com/';
my $page_url = 'http://www.reuters.com/newsEarlierArticles.jhtml?type=businessNews';
my $filename = 'temp.html';

# LWP::Simple::get returns undef on any failure; stop here rather than
# silently parsing an empty document.
my $html = get($page_url);
defined $html
    or die "Couldn't fetch $page_url\n";

# Keep writing the snapshot to disk as the script always has, but use a
# lexical handle, three-argument open, and check every step.
open my $fh, '>', $filename
    or die "Couldn't open $filename for writing: $!";
print {$fh} $html
    or die "Couldn't write to $filename: $!";
close $fh
    or die "Couldn't close $filename: $!";

# Parse the in-memory copy instead of re-reading the fixed-name file, so a
# concurrent request rewriting $filename cannot corrupt this run's input.
my $stream = HTML::TokeParser->new(\$html)
    or die "Couldn't parse HTML fetched from $page_url";

while (my $token = $stream->get_token) {
    # Only start tags of the form <td class="earlyHeadline"> are of interest.
    next unless $token->[0] eq 'S' and $token->[1] eq 'td';
    next unless ($token->[2]{'class'} || '') eq 'earlyHeadline';

    # The headline link must be the very next token after the <td>.
    my $next = $stream->get_token;
    next unless $next and $next->[0] eq 'S' and $next->[1] eq 'a';
    next unless defined $next->[2]{'href'};

    # Early headline found for the business section: emit its href,
    # resolved against the site root.
    print URI->new_abs($next->[2]{'href'}, $base_url), "\n";
}