[nzz] Add new extractor(#4407)
This commit is contained in:
		| @@ -638,6 +638,7 @@ from .nytimes import ( | ||||
|     NYTimesArticleIE, | ||||
| ) | ||||
| from .nuvid import NuvidIE | ||||
| from .nzz import NZZIE | ||||
| from .odatv import OdaTVIE | ||||
| from .odnoklassniki import OdnoklassnikiIE | ||||
| from .oktoberfesttv import OktoberfestTVIE | ||||
|   | ||||
							
								
								
									
										36
									
								
								youtube_dl/extractor/nzz.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										36
									
								
								youtube_dl/extractor/nzz.py
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,36 @@ | ||||
| # coding: utf-8 | ||||
| from __future__ import unicode_literals | ||||
|  | ||||
| import re | ||||
|  | ||||
| from .common import InfoExtractor | ||||
| from ..utils import ( | ||||
|     extract_attributes, | ||||
| ) | ||||
|  | ||||
|  | ||||
| class NZZIE(InfoExtractor): | ||||
|     _VALID_URL = r'https?://(?:www\.)?nzz\.ch/(?:[^/]+/)*[^/?#]+-ld\.(?P<id>\d+)' | ||||
|     _TEST = { | ||||
|         'url': 'http://www.nzz.ch/zuerich/gymizyte/gymizyte-schreiben-schueler-heute-noch-diktate-ld.9153', | ||||
|         'info_dict': { | ||||
|             'id': '9153', | ||||
|         }, | ||||
|         'playlist_mincount': 6, | ||||
|     } | ||||
|  | ||||
|     def _real_extract(self, url): | ||||
|         page_id = self._match_id(url) | ||||
|         webpage = self._download_webpage(url, page_id) | ||||
|  | ||||
|         entries = [] | ||||
|         for player_element in re.findall(r'(<[^>]+class="kalturaPlayer"[^>]*>)', webpage): | ||||
|             player_params = extract_attributes(player_element) | ||||
|             if player_params.get('data-type') not in ('kaltura_singleArticle',): | ||||
|                 self.report_warning('Unsupported player type') | ||||
|                 continue | ||||
|             entry_id = player_params['data-id'] | ||||
|             entries.append(self.url_result( | ||||
|                 'kaltura:1750922:' + entry_id, 'Kaltura', entry_id)) | ||||
|  | ||||
|         return self.playlist_result(entries, page_id) | ||||
		Reference in New Issue
	
	Block a user