[chirbit] Fix extraction (Closes #10296)
This commit is contained in:
		| @@ -1,30 +1,33 @@ | |||||||
| # coding: utf-8 | # coding: utf-8 | ||||||
| from __future__ import unicode_literals | from __future__ import unicode_literals | ||||||
|  |  | ||||||
|  | import base64 | ||||||
|  |  | ||||||
| from .common import InfoExtractor | from .common import InfoExtractor | ||||||
| from ..utils import ( | from ..utils import parse_duration | ||||||
|     parse_duration, |  | ||||||
|     int_or_none, |  | ||||||
| ) |  | ||||||
|  |  | ||||||
|  |  | ||||||
| class ChirbitIE(InfoExtractor): | class ChirbitIE(InfoExtractor): | ||||||
|     IE_NAME = 'chirbit' |     IE_NAME = 'chirbit' | ||||||
|     _VALID_URL = r'https?://(?:www\.)?chirb\.it/(?:(?:wp|pl)/|fb_chirbit_player\.swf\?key=)?(?P<id>[\da-zA-Z]+)' |     _VALID_URL = r'https?://(?:www\.)?chirb\.it/(?:(?:wp|pl)/|fb_chirbit_player\.swf\?key=)?(?P<id>[\da-zA-Z]+)' | ||||||
|     _TESTS = [{ |     _TESTS = [{ | ||||||
|         'url': 'http://chirb.it/PrIPv5', |         'url': 'http://chirb.it/be2abG', | ||||||
|         'md5': '9847b0dad6ac3e074568bf2cfb197de8', |  | ||||||
|         'info_dict': { |         'info_dict': { | ||||||
|             'id': 'PrIPv5', |             'id': 'be2abG', | ||||||
|             'ext': 'mp3', |             'ext': 'mp3', | ||||||
|             'title': 'Фасадстрой', |             'title': 'md5:f542ea253f5255240be4da375c6a5d7e', | ||||||
|             'duration': 52, |             'description': 'md5:f24a4e22a71763e32da5fed59e47c770', | ||||||
|             'view_count': int, |             'duration': 306, | ||||||
|             'comment_count': int, |         }, | ||||||
|  |         'params': { | ||||||
|  |             'skip_download': True, | ||||||
|         } |         } | ||||||
|     }, { |     }, { | ||||||
|         'url': 'https://chirb.it/fb_chirbit_player.swf?key=PrIPv5', |         'url': 'https://chirb.it/fb_chirbit_player.swf?key=PrIPv5', | ||||||
|         'only_matching': True, |         'only_matching': True, | ||||||
|  |     }, { | ||||||
|  |         'url': 'https://chirb.it/wp/MN58c2', | ||||||
|  |         'only_matching': True, | ||||||
|     }] |     }] | ||||||
|  |  | ||||||
|     def _real_extract(self, url): |     def _real_extract(self, url): | ||||||
| @@ -33,27 +36,30 @@ class ChirbitIE(InfoExtractor): | |||||||
|         webpage = self._download_webpage( |         webpage = self._download_webpage( | ||||||
|             'http://chirb.it/%s' % audio_id, audio_id) |             'http://chirb.it/%s' % audio_id, audio_id) | ||||||
|  |  | ||||||
|         audio_url = self._search_regex( |         data_fd = self._search_regex( | ||||||
|             r'"setFile"\s*,\s*"([^"]+)"', webpage, 'audio url') |             r'data-fd=(["\'])(?P<url>(?:(?!\1).)+)\1', | ||||||
|  |             webpage, 'data fd', group='url') | ||||||
|  |  | ||||||
|  |         # Reverse engineered from https://chirb.it/js/chirbit.player.js (look | ||||||
|  |         # for soundURL) | ||||||
|  |         audio_url = base64.b64decode( | ||||||
|  |             data_fd[::-1].encode('ascii')).decode('utf-8') | ||||||
|  |  | ||||||
|         title = self._search_regex( |         title = self._search_regex( | ||||||
|             r'itemprop="name">([^<]+)', webpage, 'title') |             r'class=["\']chirbit-title["\'][^>]*>([^<]+)', webpage, 'title') | ||||||
|         duration = parse_duration(self._html_search_meta( |         description = self._search_regex( | ||||||
|             'duration', webpage, 'duration', fatal=False)) |             r'<h3>Description</h3>\s*<pre[^>]*>([^<]+)</pre>', | ||||||
|         view_count = int_or_none(self._search_regex( |             webpage, 'description', default=None) | ||||||
|             r'itemprop="playCount"\s*>(\d+)', webpage, |         duration = parse_duration(self._search_regex( | ||||||
|             'listen count', fatal=False)) |             r'class=["\']c-length["\'][^>]*>([^<]+)', | ||||||
|         comment_count = int_or_none(self._search_regex( |             webpage, 'duration', fatal=False)) | ||||||
|             r'>(\d+) Comments?:', webpage, |  | ||||||
|             'comment count', fatal=False)) |  | ||||||
|  |  | ||||||
|         return { |         return { | ||||||
|             'id': audio_id, |             'id': audio_id, | ||||||
|             'url': audio_url, |             'url': audio_url, | ||||||
|             'title': title, |             'title': title, | ||||||
|  |             'description': description, | ||||||
|             'duration': duration, |             'duration': duration, | ||||||
|             'view_count': view_count, |  | ||||||
|             'comment_count': comment_count, |  | ||||||
|         } |         } | ||||||
|  |  | ||||||
|  |  | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user