X-Git-Url: https://git.camperquake.de/gitweb.cgi?a=blobdiff_plain;f=videosite%2FDailyMotionGrabber.pm;h=65448824863918f1ba71549365a5533fa0a1908d;hb=1cfec45c0c1cac8fdebca4313c3bcfb3a9f1ab07;hp=66fb8a0adde558d93511a28630ff25b1902c5e5f;hpb=3eca2f3ce7592dd3c723c65c0934c81a37881eed;p=videosite.git

diff --git a/videosite/DailyMotionGrabber.pm b/videosite/DailyMotionGrabber.pm
index 66fb8a0..6544882 100644
--- a/videosite/DailyMotionGrabber.pm
+++ b/videosite/DailyMotionGrabber.pm
@@ -1,10 +1,15 @@
-package DailyMotionGrabber;
+# Grabber for dailymotion.com
+#
+# (c) 2007 by Ralf Ertzinger
+# licensed under GNU GPL v2
 
-use GrabberBase;
-@ISA = qw(GrabberBase);
+package videosite::DailyMotionGrabber;
+
+use videosite::GrabberBase;
+@ISA = qw(videosite::GrabberBase);
 
-use LWP::Simple qw(!get);
 use HTML::Parser;
+use videosite::JSArrayParser;
 use Data::Dumper;
 
 use strict;
@@ -18,6 +23,8 @@ sub new {
 
     bless($self, $class);
 
+    $self->_prepare_parameters();
+
     return $self;
 }
 
@@ -38,11 +45,11 @@ sub _parse {
     $metadata->{'URL'} = $url;
     $metadata->{'ID'} = $2;
     $metadata->{'TYPE'} = 'video';
-    $metadata->{'SOURCE'} = 'dailymotion';
+    $metadata->{'SOURCE'} = $self->{'NAME'};
     $metadata->{'TITLE'} = undef;
     $metadata->{'DLURL'} = undef;
 
-    unless(defined($content = LWP::Simple::get(sprintf('http://www.dailymotion.com/video/%s', $2)))) {
+    unless(defined($content = $self->simple_get(sprintf('http://www.dailymotion.com/video/%s', $2)))) {
         $self->error('Could not download %s', $url);
         return undef;
     }
@@ -58,16 +65,51 @@ sub _parse {
         if ('meta' eq $e->[0]) {
             if ('title' eq $e->[1]->{'name'}) {
                 $metadata->{'TITLE'} = $e->[1]->{'content'};
+                $metadata->{'TITLE'} =~ s/^Dailymotion\s+-\s+//;
+                $metadata->{'TITLE'} =~ s/(?:\s+-\s+.*)?$//;
             }
         }
     }
 
     # Look for the download URL
     foreach $e (@text) {
-        if ($e->[0] =~ m|\.addVariable\("url", "([^\"]+)"|) {
-            my $decoded = $1;
-            $decoded =~ s/%(..)/chr(hex($1))/ge;
-            $metadata->{'DLURL'} = $decoded;
+        if ($e->[0] =~ m|\.addVariable\("sequence",\s*"([^\"]+)"|) {
+            my $sequence = $1;
+            my $jsp = videosite::JSArrayParser->new();
+            my $l;
+
+            # Undo the percent-encoding before handing the string to the parser
+            $sequence =~ s/%(..)/chr(hex($1))/ge;
+            $self->debug("Found sequence: %s", $sequence);
+
+            $self->debug("Using %s to parse", ref($jsp));
+            $sequence = $jsp->parse($sequence);
+            $self->debug("%s", Dumper($sequence));
+
+            unless(defined($sequence)) {
+                $self->error("Found sequence, but could not parse");
+                return undef;
+            } else {
+                $self->debug("Parsed sequence: %s", Dumper($sequence));
+
+                $l = $self->_fetch_layer($sequence, "root/layerList", "background/sequenceList", "main/layerList", "video/param");
+                unless(defined($l)) {
+                    $self->error("Could not find video layer");
+                    return undef;
+                }
+
+                # Found video section; prefer hdURL, then hqURL, then sdURL
+                if (exists($l->{'videoPluginParameters'}->{'hdURL'})) {
+                    $metadata->{'DLURL'} = $l->{'videoPluginParameters'}->{'hdURL'};
+                } elsif (exists($l->{'videoPluginParameters'}->{'hqURL'})) {
+                    $metadata->{'DLURL'} = $l->{'videoPluginParameters'}->{'hqURL'};
+                } elsif (exists($l->{'videoPluginParameters'}->{'sdURL'})) {
+                    $metadata->{'DLURL'} = $l->{'videoPluginParameters'}->{'sdURL'};
+                } else {
+                    $self->error("Video section found, but no URLs");
+                    return undef;
+                }
+            }
         }
     }
 
@@ -79,4 +121,45 @@ sub _parse {
     return $metadata;
 }
 
+# Walk a nested layer structure along a list of "name/key" path steps.
+#
+# $sequence is a reference to a list of hashes. For each step, the entry
+# whose 'name' equals the part before the slash is looked up, and the walk
+# continues with the value stored in that entry under the key after the slash.
+#
+# Returns $sequence itself once no steps remain, or undef if a named entry
+# or the requested key inside it is missing.
+sub _fetch_layer {
+    my $self = shift;
+    my $sequence = shift;
+    my $point = shift;
+    my $next;
+    my @points = @_;
+
+    $self->debug("Looking for %s in %s", $point, Dumper($sequence));
+
+    unless(defined($point)) {
+        $self->debug("Reached last point");
+        return $sequence;
+    }
+    ($point, $next) = split(/\//, $point, 2);
+
+    foreach (@{$sequence}) {
+        # Only the first entry with a matching name is examined
+        if (exists($_->{'name'}) and ($_->{'name'} eq $point)) {
+            if (exists($_->{$next})) {
+                $self->debug("Using %s in %s", $next, $point);
+                return $self->_fetch_layer($_->{$next}, @points);
+            } else {
+                $self->debug("%s found, but no %s", $point, $next);
+                return undef;
+            }
+
+        }
+    }
+
+    $self->debug("Could not find entry named %s", $point);
+    return undef;
+}
+
 1;