#! /usr/bin/env perl
use warnings;
use strict;
use Carp;

sub utility::get_title;

# A complete screen-scraper and RSS generator
# adapted from XML::RSS::SimpleGen POD
use XML::RSS::SimpleGen;

# NOTE(review): the two imports below are not visible in the damaged copy of
# this file.  They are inferred from the calls that survive in
# utility::get_title -- get(), ->parse() and ->header('Title') -- confirm
# against the original source.
use LWP::Simple qw(get);
use HTML::HeadParser;

# FIXME(review): the URL literal was lost (the damaged copy reads `q;`).  The
# value below is inferred from the base URL used in utility::get_title --
# confirm it is the page that should be scraped.
my $url = q<http://web.mit.edu/belg4mit/www/>;

rss_new( $url, "YAPAC", "Yet Another Perl (Advent) Calendar" );
rss_language( 'en' );
rss_webmaster( 'jpierce@cpan.org' );

# image is not supposed to be a favicon, but a GIF, skip for now.
# rss_image("http://yourpath.com/icon.gif",32,32);
rss_daily();

# In void context get_url() leaves the fetched page in $_ for matching.
get_url( $url );

my @pages;    # List of things to process

# FIXME(review): the item-matching loop was lost when markup was stripped from
# this file: the pattern, the loop body, and everything that followed it up to
# the tail of utility::get_title.  The surviving fragments, verbatim, were:
#
#     while( # was # m{
#     \s*(.*?)\s*
#     \s*(.*?)
#
# Nothing is invented here.  Fail loudly so an empty or bogus feed is never
# produced; restore the loop and the feed-saving code from the original source.
die "Item-matching loop lost from this script; restore it before running\n";

# utility::get_title( $page )
#
# Fetch http://web.mit.edu/belg4mit/www/$page and return the value of its
# 'Title' header as reported by the header parser.
#
#   $page   - page name appended to the base URL; required (croaks if false).
#   returns - the 'Title' header value, or nothing (bare return, after a
#             warning) when the fetch yields no content.
sub utility::get_title {
    my $date = shift || croak "get_title requires arg of page name";

    # NOTE(review): only `new();` survives of this constructor call;
    # HTML::HeadParser is inferred from the parse()/header() calls below.
    my $header = HTML::HeadParser->new();

    # Keep the URL in a lexical rather than assigning it to $_ : the main
    # script matches against the page that get_url() left in the global $_,
    # so writing to $_ here would clobber it.
    my $page_url = "http://web.mit.edu/belg4mit/www/$date";
    my $content  = get($page_url);

    unless ($content) {
        warn("No content for: $page_url\n");
        return;
    }

    $header->parse($content);
    return $header->header('Title');
}