X-Git-Url: https://git.camperquake.de/gitweb.cgi?a=blobdiff_plain;f=videosite%2FDailyMotionGrabber.pm;h=981fef7b7c00cfb1a2841428872282b24dd4e8d8;hb=07ae64102eb11bca1a0c2b32599f96c6d2f9db70;hp=d08e71bc927f976a7772c742af4d3a0deb3d167a;hpb=b97a01912322f6ebccf2713c3bbbcc266f02c7b5;p=videosite.git diff --git a/videosite/DailyMotionGrabber.pm b/videosite/DailyMotionGrabber.pm index d08e71b..981fef7 100644 --- a/videosite/DailyMotionGrabber.pm +++ b/videosite/DailyMotionGrabber.pm @@ -1,14 +1,16 @@ +# Grabber for dailymotion.com # -# download strategy revised using -# http://www.kde-apps.org/content/show.php?content=41456 +# (c) 2007 by Ralf Ertzinger +# licensed under GNU GPL v2 -package DailyMotionGrabber; +package videosite::DailyMotionGrabber; -use GrabberBase; -@ISA = qw(GrabberBase); +use videosite::GrabberBase; +@ISA = qw(videosite::GrabberBase); use LWP::Simple qw(!get); use HTML::Parser; +use videosite::JSArrayParser; use Data::Dumper; use strict; @@ -17,11 +19,13 @@ sub new { my $class = shift; my $self = $class->SUPER::new(); - $self->{'NAME'} = 'youtube'; - $self->{'PATTERNS'} = ['(http://(?:[-a-zA-Z0-9_.]+\.)*.dailymotion.com/(?:[^/]+/)*video/([-a-zA-Z0-9_]+)']; + $self->{'NAME'} = 'dailymotion'; + $self->{'PATTERNS'} = ['(http://(?:[-a-zA-Z0-9_.]+\.)*dailymotion.com/(?:[^/]+/)*video/([-a-zA-Z0-9_]+))']; bless($self, $class); + $self->_prepare_parameters(); + return $self; } @@ -42,7 +46,7 @@ sub _parse { $metadata->{'URL'} = $url; $metadata->{'ID'} = $2; $metadata->{'TYPE'} = 'video'; - $metadata->{'SOURCE'} = 'dailymotion'; + $metadata->{'SOURCE'} = $self->{'NAME'}; $metadata->{'TITLE'} = undef; $metadata->{'DLURL'} = undef; @@ -62,14 +66,60 @@ sub _parse { if ('meta' eq $e->[0]) { if ('title' eq $e->[1]->{'name'}) { $metadata->{'TITLE'} = $e->[1]->{'content'}; + $metadata->{'TITLE'} =~ s/^Dailymotion\s+-\s+//; + $metadata->{'TITLE'} =~ s/(?:\s+-\s+.*)?$//; } } } # Look for the download URL foreach $e (@text) { - if ($e->[0] =~ m|\.add_variable("url", "([^\"]+)")|) { - $metadata->{'DLURL'} = $1; + if ($e->[0] =~ m|\.addVariable\("sequence",\s*"([^\"]+)"|) { + my $sequence = $1; + my $jsp = videosite::JSArrayParser->new(); + my $main; + my $s; + + $sequence =~ s/%(..)/chr(hex($1))/ge; + $self->debug("Found sequence: %s", $sequence); + + $self->debug("Using %s to parse", ref($jsp)); + $sequence = $jsp->parse($sequence); + $self->debug(Dumper($sequence)); + + unless(defined($sequence)) { + $self->error("Found sequence, but could not parse"); + return undef; + } else { + $self->debug("Parsed sequence: %s", Dumper($sequence)); + + foreach (@{$sequence}) { + if (exists($_->{'name'}) && ($_->{'name'} eq 'main')) { + # Found main section + $main = $_->{'layerList'}; + } + } + unless(defined($main)) { + $self->error("Could not find layerList[main]"); + return undef; + } + + foreach (@{$main}) { + if (exists($_->{'name'}) && ($_->{'name'} eq 'video')) { + # Found video section + if (exists($_->{'param'}->{'hdURL'})) { + $metadata->{'DLURL'} = $_->{'param'}->{'hdURL'}; + } elsif (exists($_->{'param'}->{'hqURL'})) { + $metadata->{'DLURL'} = $_->{'param'}->{'hqURL'}; + } elsif (exists($_->{'param'}->{'hqURL'})) { + $metadata->{'DLURL'} = $_->{'param'}->{'sdURL'}; + } else { + $self->error("Video section found, but no URLs"); + return undef; + } + } + } + } } }