Add support for drtuber.com

This commit is contained in:
peugeot 2014-09-01 20:12:51 +02:00
parent 07e7dc4bdc
commit d740f7e16f
2 changed files with 49 additions and 0 deletions

View file

@ -70,6 +70,7 @@ from .daum import DaumIE
from .dfb import DFBIE from .dfb import DFBIE
from .dotsub import DotsubIE from .dotsub import DotsubIE
from .dreisat import DreiSatIE from .dreisat import DreiSatIE
from .drtuber import DrTuberIE
from .drtv import DRTVIE from .drtv import DRTVIE
from .dump import DumpIE from .dump import DumpIE
from .defense import DefenseGouvFrIE from .defense import DefenseGouvFrIE

View file

@ -0,0 +1,48 @@
from __future__ import unicode_literals
import re
from .common import InfoExtractor
class DrTuberIE(InfoExtractor):
_VALID_URL = r'https?://(?:www\.)?drtuber\.com/video/(?P<id>\d+)/(?P<title_dash>[\w-]+)'
_TEST = {
'url': 'http://www.drtuber.com/video/1740434/hot-perky-blonde-naked-golf',
'md5': '93e680cf2536ad0dfb7e74d94a89facd',
'info_dict': {
'id': '1740434',
'ext': 'mp4',
'title': 'Hot Perky Blonde Naked Golf',
'categories': list, # NSFW
'thumbnail': 're:https?://.*\.jpg$',
}
}
def _real_extract(self, url):
mobj = re.match(self._VALID_URL, url)
video_id = mobj.group('id')
webpage = self._download_webpage(url, video_id)
video_url = self._html_search_regex(
r'<source src="([^"]+)"', webpage, 'video URL')
title = self._html_search_regex(
r'<title>([^<]+)\s*-\s*Free', webpage, 'title')
thumbnail = self._html_search_regex(
r'poster="([^"]+)"',
webpage, 'thumbnail', fatal=False)
categories_str = self._html_search_regex(
r'<meta name="keywords" content="([^"]+)"', webpage, 'categories', fatal=False)
categories = categories_str.split(' ')
return {
'id': video_id,
'url': video_url,
'title': title,
'thumbnail': thumbnail,
'categories': categories,
}