[bpb] Fix extraction and update tests
This commit is contained in:
		| @@ -1,7 +1,13 @@ | |||||||
| # coding: utf-8 | # coding: utf-8 | ||||||
| from __future__ import unicode_literals | from __future__ import unicode_literals | ||||||
|  |  | ||||||
|  | import re | ||||||
|  |  | ||||||
| from .common import InfoExtractor | from .common import InfoExtractor | ||||||
|  | from ..utils import ( | ||||||
|  |     js_to_json, | ||||||
|  |     determine_ext, | ||||||
|  | ) | ||||||
|  |  | ||||||
|  |  | ||||||
| class BpbIE(InfoExtractor): | class BpbIE(InfoExtractor): | ||||||
| @@ -10,7 +16,8 @@ class BpbIE(InfoExtractor): | |||||||
|  |  | ||||||
|     _TEST = { |     _TEST = { | ||||||
|         'url': 'http://www.bpb.de/mediathek/297/joachim-gauck-zu-1989-und-die-erinnerung-an-die-ddr', |         'url': 'http://www.bpb.de/mediathek/297/joachim-gauck-zu-1989-und-die-erinnerung-an-die-ddr', | ||||||
|         'md5': '0792086e8e2bfbac9cdf27835d5f2093', |         # md5 fails in Python 2.6 due to buggy server response and wrong handling of urllib2 | ||||||
|  |         'md5': 'c4f84c8a8044ca9ff68bb8441d300b3f', | ||||||
|         'info_dict': { |         'info_dict': { | ||||||
|             'id': '297', |             'id': '297', | ||||||
|             'ext': 'mp4', |             'ext': 'mp4', | ||||||
| @@ -25,13 +32,26 @@ class BpbIE(InfoExtractor): | |||||||
|  |  | ||||||
|         title = self._html_search_regex( |         title = self._html_search_regex( | ||||||
|             r'<h2 class="white">(.*?)</h2>', webpage, 'title') |             r'<h2 class="white">(.*?)</h2>', webpage, 'title') | ||||||
|         video_url = self._html_search_regex( |         video_info_dicts = re.findall( | ||||||
|             r'(http://film\.bpb\.de/player/dokument_[0-9]+\.mp4)', |             r"({\s*src:\s*'http://film\.bpb\.de/[^}]+})", webpage) | ||||||
|             webpage, 'video URL') |  | ||||||
|  |         formats = [] | ||||||
|  |         for video_info in video_info_dicts: | ||||||
|  |             video_info = self._parse_json(video_info, video_id, transform_source=js_to_json) | ||||||
|  |             quality = video_info['quality'] | ||||||
|  |             video_url = video_info['src'] | ||||||
|  |             formats.append({ | ||||||
|  |                 'url': video_url, | ||||||
|  |                 'preference': 10 if quality == 'high' else 0, | ||||||
|  |                 'format_note': quality, | ||||||
|  |                 'format_id': '%s-%s' % (quality, determine_ext(video_url)), | ||||||
|  |             }) | ||||||
|  |  | ||||||
|  |         self._sort_formats(formats) | ||||||
|  |  | ||||||
|         return { |         return { | ||||||
|             'id': video_id, |             'id': video_id, | ||||||
|             'url': video_url, |             'formats': formats, | ||||||
|             'title': title, |             'title': title, | ||||||
|             'description': self._og_search_description(webpage), |             'description': self._og_search_description(webpage), | ||||||
|         } |         } | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user