[liveleak] add support for another embed type and restore original format extraction
This commit is contained in:
		| @@ -87,7 +87,7 @@ class LiveLeakIE(InfoExtractor): | |||||||
|     @staticmethod |     @staticmethod | ||||||
|     def _extract_urls(webpage): |     def _extract_urls(webpage): | ||||||
|         return re.findall( |         return re.findall( | ||||||
|             r'<iframe[^>]+src="(https?://(?:\w+\.)?liveleak\.com/ll_embed\?[^"]*[if]=[\w_]+[^"]+)"', |             r'<iframe[^>]+src="(https?://(?:\w+\.)?liveleak\.com/ll_embed\?[^"]*[ift]=[\w_]+[^"]+)"', | ||||||
|             webpage) |             webpage) | ||||||
|  |  | ||||||
|     def _real_extract(self, url): |     def _real_extract(self, url): | ||||||
| @@ -120,13 +120,27 @@ class LiveLeakIE(InfoExtractor): | |||||||
|             } |             } | ||||||
|  |  | ||||||
|         for idx, info_dict in enumerate(entries): |         for idx, info_dict in enumerate(entries): | ||||||
|  |             formats = [] | ||||||
|             for a_format in info_dict['formats']: |             for a_format in info_dict['formats']: | ||||||
|                 if not a_format.get('height'): |                 if not a_format.get('height'): | ||||||
|                     a_format['height'] = int_or_none(self._search_regex( |                     a_format['height'] = int_or_none(self._search_regex( | ||||||
|                         r'([0-9]+)p\.mp4', a_format['url'], 'height label', |                         r'([0-9]+)p\.mp4', a_format['url'], 'height label', | ||||||
|                         default=None)) |                         default=None)) | ||||||
|  |                 formats.append(a_format) | ||||||
|  |  | ||||||
|             self._sort_formats(info_dict['formats']) |                 # Removing '.*.mp4' gives the raw video, which is essentially | ||||||
|  |                 # the same video without the LiveLeak logo at the top (see | ||||||
|  |                 # https://github.com/rg3/youtube-dl/pull/4768) | ||||||
|  |                 orig_url = re.sub(r'\.mp4\.[^.]+', '', a_format['url']) | ||||||
|  |                 if a_format['url'] != orig_url: | ||||||
|  |                     format_id = a_format.get('format_id') | ||||||
|  |                     formats.append({ | ||||||
|  |                         'format_id': 'original' + ('-' + format_id if format_id else ''), | ||||||
|  |                         'url': orig_url, | ||||||
|  |                         'preference': 1, | ||||||
|  |                     }) | ||||||
|  |             self._sort_formats(formats) | ||||||
|  |             info_dict['formats'] = formats | ||||||
|  |  | ||||||
|             # Don't append entry ID for one-video pages to keep backward compatibility |             # Don't append entry ID for one-video pages to keep backward compatibility | ||||||
|             if len(entries) > 1: |             if len(entries) > 1: | ||||||
| @@ -146,7 +160,7 @@ class LiveLeakIE(InfoExtractor): | |||||||
|  |  | ||||||
|  |  | ||||||
| class LiveLeakEmbedIE(InfoExtractor): | class LiveLeakEmbedIE(InfoExtractor): | ||||||
|     _VALID_URL = r'https?://(?:www\.)?liveleak\.com/ll_embed\?.*?\b(?P<kind>[if])=(?P<id>[\w_]+)' |     _VALID_URL = r'https?://(?:www\.)?liveleak\.com/ll_embed\?.*?\b(?P<kind>[ift])=(?P<id>[\w_]+)' | ||||||
|  |  | ||||||
|     # See generic.py for actual test cases |     # See generic.py for actual test cases | ||||||
|     _TESTS = [{ |     _TESTS = [{ | ||||||
| @@ -158,15 +172,14 @@ class LiveLeakEmbedIE(InfoExtractor): | |||||||
|     }] |     }] | ||||||
|  |  | ||||||
|     def _real_extract(self, url): |     def _real_extract(self, url): | ||||||
|         mobj = re.match(self._VALID_URL, url) |         kind, video_id = re.match(self._VALID_URL, url).groups() | ||||||
|         kind, video_id = mobj.group('kind', 'id') |  | ||||||
|  |  | ||||||
|         if kind == 'f': |         if kind == 'f': | ||||||
|             webpage = self._download_webpage(url, video_id) |             webpage = self._download_webpage(url, video_id) | ||||||
|             liveleak_url = self._search_regex( |             liveleak_url = self._search_regex( | ||||||
|                 r'logourl\s*:\s*(?P<q1>[\'"])(?P<url>%s)(?P=q1)' % LiveLeakIE._VALID_URL, |                 r'(?:logourl\s*:\s*|window\.open\()(?P<q1>[\'"])(?P<url>%s)(?P=q1)' % LiveLeakIE._VALID_URL, | ||||||
|                 webpage, 'LiveLeak URL', group='url') |                 webpage, 'LiveLeak URL', group='url') | ||||||
|         elif kind == 'i': |         else: | ||||||
|             liveleak_url = 'http://www.liveleak.com/view?i=%s' % video_id |             liveleak_url = 'http://www.liveleak.com/view?%s=%s' % (kind, video_id) | ||||||
|  |  | ||||||
|         return self.url_result(liveleak_url, ie=LiveLeakIE.ie_key()) |         return self.url_result(liveleak_url, ie=LiveLeakIE.ie_key()) | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user