[imdb] Fix extraction

The path to each format's page may have leading whitespace, so strip it before joining it with the base URL.
The height and the duration can no longer be extracted, so those fields are no longer set.
This commit is contained in:
Jaime Marquínez Ferrándiz 2013-12-06 20:26:55 +01:00
parent 0b6a9f639f
commit d349cd2240

View File

@ -21,7 +21,6 @@ class ImdbIE(InfoExtractor):
u'ext': u'mp4', u'ext': u'mp4',
u'title': u'Ice Age: Continental Drift Trailer (No. 2) - IMDb', u'title': u'Ice Age: Continental Drift Trailer (No. 2) - IMDb',
u'description': u'md5:9061c2219254e5d14e03c25c98e96a81', u'description': u'md5:9061c2219254e5d14e03c25c98e96a81',
u'duration': 151,
} }
} }
@ -35,6 +34,7 @@ def _real_extract(self, url):
flags=re.MULTILINE) flags=re.MULTILINE)
formats = [] formats = []
for f_id, f_path in available_formats: for f_id, f_path in available_formats:
f_path = f_path.strip()
format_page = self._download_webpage( format_page = self._download_webpage(
compat_urlparse.urljoin(url, f_path), compat_urlparse.urljoin(url, f_path),
u'Downloading info for %s format' % f_id) u'Downloading info for %s format' % f_id)
@ -46,7 +46,6 @@ def _real_extract(self, url):
formats.append({ formats.append({
'format_id': f_id, 'format_id': f_id,
'url': format_info['url'], 'url': format_info['url'],
'height': int(info['titleObject']['encoding']['selected'][:-1]),
}) })
return { return {
@ -55,5 +54,4 @@ def _real_extract(self, url):
'formats': formats, 'formats': formats,
'description': descr, 'description': descr,
'thumbnail': format_info['slate'], 'thumbnail': format_info['slate'],
'duration': int(info['titleObject']['title']['duration_seconds']),
} }