1
0
mirror of https://github.com/ytdl-org/youtube-dl.git synced 2025-01-18 01:16:42 +01:00

[nuvid] Add new extractor

This commit is contained in:
hojel 2014-05-12 03:48:40 -07:00
parent e399853d0c
commit 749fe60c1e
2 changed files with 40 additions and 0 deletions

View File

@ -194,6 +194,7 @@ from .nowvideo import NowVideoIE
from .nrk import NRKIE
from .ntv import NTVIE
from .nytimes import NYTimesIE
from .nuvid import NuvidIE
from .oe1 import OE1IE
from .ooyala import OoyalaIE
from .orf import ORFIE

View File

@ -0,0 +1,39 @@
import re
from .common import InfoExtractor
class NuvidIE(InfoExtractor):
    """Information extractor for nuvid.com video pages.

    Accepts both the ``www.`` and ``m.`` hosts (see ``_VALID_URL``); the
    page is always downloaded from the ``m.`` host.
    """

    _VALID_URL = r'^https?://(?:www|m)\.nuvid\.com/video/(?P<videoid>\d+)'
    _TEST = {
        u'url': u'http://m.nuvid.com/video/1310741/',
        u'file': u'1310741.mp4',
        u'md5': u'eab207b7ac4fccfb4e23c86201f11277',
        u'info_dict': {
            u"title": u"Horny babes show their awesome bodeis and",
            u"age_limit": 18,
        }
    }

    def _real_extract(self, url):
        """Extract the video information for a nuvid.com video URL.

        Args:
            url: A URL matching ``_VALID_URL``.

        Returns:
            A one-element list holding the info dict with the keys ``id``,
            ``url``, ``title``, ``ext`` and ``age_limit``, plus
            ``thumbnail`` when a thumbnail link is present on the page.
        """
        # Links scraped from the page are site-relative paths; they are
        # resolved against the host the page is fetched from.
        mobile_base = 'http://m.nuvid.com'

        mobj = re.match(self._VALID_URL, url)
        video_id = mobj.group('videoid')

        # Get webpage content (rewrite www. URLs to the m. host first)
        murl = url.replace('//www.', '//m.')
        webpage = self._download_webpage(murl, video_id)

        video_title = self._html_search_regex(
            r'<div class="title">\s+<h2[^>]*>([^<]+)</h2>',
            webpage, 'video_title').strip()
        video_path = self._html_search_regex(
            r'href="(/mp4/[^"]+)"[^>]*data-link_type="mp4"',
            webpage, 'video_url')
        # The thumbnail is optional metadata: a missing link must not abort
        # an extraction that already found the video itself.
        thumb_path = self._html_search_regex(
            r'href="(/thumbs/[^"]+)"[^>]*data-link_type="thumbs"',
            webpage, 'video_thumb', fatal=False)

        info = {
            'id': video_id,
            'url': mobile_base + video_path,
            'title': video_title,
            'ext': 'mp4',
            'age_limit': 18,
        }
        if thumb_path:
            # Emit an absolute URL, consistent with how 'url' is built.
            info['thumbnail'] = mobile_base + thumb_path
        return [info]