X-Git-Url: https://git.camperquake.de/gitweb.cgi?a=blobdiff_plain;f=videosite%2FZeroPunctuationGrabber.pm;h=241f4b67c0368ee48a84cfcaa55918165a70068b;hb=17bca93d2b471f5f099a4046297159a029989430;hp=2a938407e13268f005cb625356fd988a17cb59cd;hpb=a018c395f1f0d469b199512ded838d4f6f6061b7;p=videosite.git diff --git a/videosite/ZeroPunctuationGrabber.pm b/videosite/ZeroPunctuationGrabber.pm index 2a93840..241f4b6 100644 --- a/videosite/ZeroPunctuationGrabber.pm +++ b/videosite/ZeroPunctuationGrabber.pm @@ -3,28 +3,27 @@ # # Grabber for www.escapistmagazine.com/articles/view/editorials/zeropunctuation -package ZeroPunctuationGrabber; +package videosite::ZeroPunctuationGrabber; -use GrabberBase; -@ISA = qw(GrabberBase); +use videosite::GrabberBase; +@ISA = qw(videosite::GrabberBase); -use LWP::Simple qw(!get); use HTML::TokeParser; use Data::Dumper; +use videosite::JSArrayParser; use strict; sub new { my $class = shift; - my $self = $class->SUPER::new(); - - $self->{'NAME'} = 'zeropunctuation'; - $self->{'PATTERNS'} = ['(http://www.escapistmagazine.com/articles/view/editorials/zeropunctuation/([-A-Za-z0-9]+))']; - - bless($self, $class); - $self->_prepare_parameters(); - - return $self; + my $self = $class->SUPER::new( + NAME => 'zeropunctuation', + _SELFTESTURL => 'http://www.escapistmagazine.com/videos/view/zero-punctuation/5346-Amy', + _SELFTESTTITLE =>'Amy', + PATTERNS => ['(http://www.escapistmagazine.com/videos/view/zero-punctuation/([-A-Za-z0-9]+))'], + ); + + return bless($self, $class); } sub _parse { @@ -35,6 +34,9 @@ sub _parse { my $metadata = {}; my $p; my $e; + my $j; + my $jsp; + my $r; $url =~ m|$pattern|; $url = $1; @@ -46,23 +48,40 @@ sub _parse { $metadata->{'TITLE'} = undef; $metadata->{'DLURL'} = undef; - unless(defined($content = LWP::Simple::get($url))) { + unless(defined($content = $self->simple_get($url))) { $self->error('Could not download %s', $url); return undef; } $p = HTML::TokeParser->new(\$content); - # Look for the title - if ($p->get_tag('title')) { - $metadata->{'TITLE'} = $p->get_text(); - $metadata->{'TITLE'} =~ s/^The Escapist : Zero Punctuation: (.*)$/$1/im; + while ($e = $p->get_tag('div', 'param')) { + if (($e->[0] eq 'param') and exists($e->[1]->{name}) and ($e->[1]->{name} eq 'flashvars')) { + my %r = map { $self->decode_hexurl($_) } split(/[&=]/, $e->[1]->{value}); + + unless(exists($r{config})) { + $self->error("config URL not found in flashvars"); + return undef; + } + + $j = $r{config}; + } elsif (($e->[0] eq 'div') and exists($e->[1]->{itemprop}) and ($e->[1]->{itemprop} eq 'name')) { + $metadata->{'TITLE'} = $p->get_phrase(); + } } - while ($e = $p->get_tag('script')) { - my $c = $p->get_text(); - if ($c =~ m|var vars = \{file:\x27([^\x27]+)\x27|) { - $metadata->{'DLURL'} = 'http://' . $1 . '_high.flv'; + unless(defined($content = $self->simple_get($j))) { + $self->error("Could not download %s", $j); + return undef; + } + + $jsp = videosite::JSArrayParser->new(); + $r = $jsp->parse($content); + + foreach (@{$r->{playlist}}) { + if ($_->{eventCategory} eq 'Video') { + $metadata->{'DLURL'} = $_->{url}; + last; } }