From 06718ca32510df74bbefe4e6428aa0d857ecb0ec Mon Sep 17 00:00:00 2001
From: Ralf Ertzinger
Date: Sun, 27 Jan 2008 23:46:36 +0100
Subject: [PATCH] - Add spikedhumor grabber

---
 videosite/SpikedHumorGrabber.pm | 120 ++++++++++++++++++++++++++++++++++++++++
 1 file changed, 120 insertions(+)
 create mode 100644 videosite/SpikedHumorGrabber.pm

diff --git a/videosite/SpikedHumorGrabber.pm b/videosite/SpikedHumorGrabber.pm
new file mode 100644
index 0000000..9925a30
--- /dev/null
+++ b/videosite/SpikedHumorGrabber.pm
@@ -0,0 +1,120 @@
+# (c) 2007 by Ralf Ertzinger
+# licensed under GNU GPL v2
+#
+# Grabber for spikedhumor.com
+
+package SpikedHumorGrabber;
+
+use strict;
+use warnings;
+
+use GrabberBase;
+our @ISA = qw(GrabberBase);
+
+use LWP::Simple qw(!get);
+use XML::Simple;
+use Data::Dumper;
+
+# Create a new grabber instance.
+#
+# Sets the grabber name and the URL patterns it handles, then calls
+# _prepare_parameters(). In each pattern, capture group 1 is the whole
+# article URL and capture group 2 is the numeric article ID; _parse()
+# relies on that layout.
+sub new {
+    my $class = shift;
+    my $self = $class->SUPER::new();
+
+    $self->{'NAME'} = 'spikedhumor';
+    # The dot in the domain is escaped so it only matches a literal '.'
+    $self->{'PATTERNS'} = ['(http://(?:[-a-zA-Z0-9_.]+\.)*spikedhumor\.com/articles/(\d+)(?:/.*)*)'];
+
+    # Bless into the calling class; whether SUPER::new() already does this
+    # is not visible from this file
+    bless($self, $class);
+    $self->_prepare_parameters();
+
+    return $self;
+}
+
+# Extract the video metadata for a spikedhumor article URL.
+#
+# Parameters:
+#   $url     - the URL to examine
+#   $pattern - regular expression to match the URL against; capture group 1
+#              must be the article URL, capture group 2 the article ID
+#
+# Returns a hash reference with the keys URL, ID, TYPE, SOURCE, TITLE and
+# DLURL on success. On failure the problem is reported through
+# $self->error() and undef is returned.
+sub _parse {
+    my $self = shift;
+    my $url = shift;
+    my $pattern = shift;
+
+    # Take the captures from the match result itself. After a failed match
+    # $1 and $2 still hold the values of an earlier successful match, so
+    # they must not be read unchecked.
+    my ($article_url, $id);
+    if(defined($url) && defined($pattern)) {
+        ($article_url, $id) = ($url =~ m|$pattern|);
+    }
+    unless(defined($article_url) && defined($id)) {
+        $self->error('Could not extract article ID from URL');
+        return undef;
+    }
+
+    my $metadata = {
+        'URL'    => $article_url,
+        'ID'     => $id,
+        'TYPE'   => 'video',
+        'SOURCE' => $self->{'NAME'},
+        'TITLE'  => undef,
+        'DLURL'  => undef,
+    };
+
+    # Get the XML file containing the video metadata
+    my $content = LWP::Simple::get(sprintf('http://www.spikedhumor.com/playxml/%s/data.xml', $id));
+    unless(defined($content)) {
+        $self->error('Could not download XML metadata');
+        return undef;
+    }
+
+    # XMLin() dies on malformed XML instead of returning undef, so the call
+    # is wrapped in eval. It also treats input without any markup as a file
+    # name (or as STDIN for '-'); that must never happen with data fetched
+    # from the network, so such input is rejected up front.
+    my $t;
+    if($content =~ m|<.*?>|s) {
+        $t = eval { XML::Simple->new()->XMLin($content, KeepRoot => 1) };
+    }
+    unless(defined($t)) {
+        $self->error('Could not parse XML metadata');
+        return undef;
+    }
+
+    # Walk down to the list item without assuming the document's shape:
+    # dereferencing a node that is not a hash (plain text, or an array for
+    # repeated elements) as a hash would die.
+    my $item = $t;
+    foreach my $key ('playlist', 'listitem') {
+        $item = (ref($item) eq 'HASH') ? $item->{$key} : undef;
+    }
+    if(ref($item) eq 'HASH') {
+        $metadata->{'DLURL'} = $item->{'url'};
+        $metadata->{'TITLE'} = $item->{'name'};
+    }
+
+    # Both values have to be plain strings. XML::Simple represents an empty
+    # element as an empty hash reference, which is defined but unusable.
+    foreach my $key ('DLURL', 'TITLE') {
+        unless(defined($metadata->{$key}) && !ref($metadata->{$key})) {
+            $self->error('Could not extract download URL and title');
+            return undef;
+        }
+    }
+
+    return $metadata;
+}
+
+1;
-- 
1.8.3.1