X-Git-Url: https://git.camperquake.de/gitweb.cgi?a=blobdiff_plain;f=videosite%2FBreakGrabber.pm;h=6bd77e1a5275c881e1e0d976157544737fda193d;hb=89e8775f8f880bd14731e4501d13a3d63fe5fcb5;hp=4870da8be995885e9499d422b7a7848d6efc160a;hpb=c9eaebd4eec29a38c2b89c581438ce94e32b1814;p=videosite.git diff --git a/videosite/BreakGrabber.pm b/videosite/BreakGrabber.pm index 4870da8..6bd77e1 100644 --- a/videosite/BreakGrabber.pm +++ b/videosite/BreakGrabber.pm @@ -3,29 +3,25 @@ # (c) 2007 by Ralf Ertzinger # licensed under GNU GPL v2 -package BreakGrabber; +package videosite::BreakGrabber; -use GrabberBase; -@ISA = qw(GrabberBase); +use videosite::GrabberBase; +@ISA = qw(videosite::GrabberBase); -use LWP::Simple qw(!get); -use HTML::Parser; +use videosite::HTMLHelper; use Data::Dumper; use strict; sub new { my $class = shift; - my $self = $class->SUPER::new(); + my $self = $class->SUPER::new( + NAME => 'break', + PATTERNS => ['(http://(?:[-a-zA-Z0-9_.]+\.)*break.com/index/([-a-zA-Z0-9_]+?)\.html)'], + @_, + ); - $self->{'NAME'} = 'break'; - $self->{'PATTERNS'} = ['(http://(?:[-a-zA-Z0-9_.]+\.)*break.com/index/([-a-zA-Z0-9_]+?)\.html)']; - - bless($self, $class); - - $self->_prepare_parameters(); - - return $self; + return bless($self, $class); } sub _parse { @@ -34,10 +30,8 @@ sub _parse { my $pattern = shift; my $content; my $metadata = {}; - my $p = HTML::Parser->new(api_version => 3); - my @accum; - my @text; - my $e; + my $p = videosite::HTMLHelper->new(); + my $n; $url =~ m|$pattern|; $url = $1; @@ -49,28 +43,20 @@ sub _parse { $metadata->{'TITLE'} = undef; $metadata->{'DLURL'} = undef; - unless(defined($content = LWP::Simple::get($1))) { + unless(defined($content = $p->load($1))) { $self->error('Could not download %s', $url); return undef; } - $p->handler(start => \@accum, "tagname, attr"); - $p->report_tags(qw(meta)); - $p->utf8_mode(1); - $p->parse($content); - - # Look for the title in the meta tags - foreach $e (@accum) { - if ('meta' eq $e->[0]) { - if ('embed_video_title' eq $e->[1]->{'name'}) { - $metadata->{'TITLE'} = $e->[1]->{'content'}; - } + $n = $p->findnodes('meta[@name="embed_video_title"]'); + if (defined($n)) { + $metadata->{'TITLE'} = $n->{'content'}; + } - if ('embed_video_thumb_url' eq $e->[1]->{'name'}) { - $metadata->{'DLURL'} = $e->[1]->{'content'}; - $metadata->{'DLURL'} =~ s/\.jpg$/\.flv/; - } - } + $n = $p->findnodes('meta[@name="embed_video_thumb_url"]'); + if (defined($n)) { + $metadata->{'DLURL'} = $n->{'content'}; + $metadata->{'DLURL'} =~ s/\.jpg$/\.flv/; } unless(defined($metadata->{'DLURL'}) && defined($metadata->{'TITLE'})) {