Added an InfoExtractor (IE) for criterion.com
This commit is contained in:
		@@ -8,6 +8,7 @@ from .breakcom import BreakIE
 | 
				
			|||||||
from .brightcove import BrightcoveIE
 | 
					from .brightcove import BrightcoveIE
 | 
				
			||||||
from .collegehumor import CollegeHumorIE
 | 
					from .collegehumor import CollegeHumorIE
 | 
				
			||||||
from .comedycentral import ComedyCentralIE
 | 
					from .comedycentral import ComedyCentralIE
 | 
				
			||||||
 | 
					from .criterion import CriterionIE
 | 
				
			||||||
from .cspan import CSpanIE
 | 
					from .cspan import CSpanIE
 | 
				
			||||||
from .dailymotion import DailymotionIE
 | 
					from .dailymotion import DailymotionIE
 | 
				
			||||||
from .depositfiles import DepositFilesIE
 | 
					from .depositfiles import DepositFilesIE
 | 
				
			||||||
 
 | 
				
			|||||||
							
								
								
									
										31
									
								
								youtube_dl/extractor/criterion.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										31
									
								
								youtube_dl/extractor/criterion.py
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,31 @@
 | 
				
			|||||||
 | 
					# -*- coding: utf-8 -*-
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					import re
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					from .common import InfoExtractor
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					class CriterionIE(InfoExtractor):
					    """Information extractor for film pages on criterion.com."""

					    # The dots are escaped so they only match a literal ".", and both
					    # http and https URLs are accepted. Group 1 captures everything that
					    # follows "/films/".
					    _VALID_URL = r'https?://www\.criterion\.com/films/(.*)'

					    def _real_extract(self, url):
					        """Build the info dictionary for the film page at ``url``.

					        The video id is the part of the URL after ``/films/`` up to the
					        first ``-``. The media and thumbnail URLs are read from the
					        ``so.addVariable(...)`` calls embedded in the downloaded page; the
					        title and description are read from its ``<meta>`` tags.

					        Returns a dict with the keys ``id``, ``url``, ``title``, ``ext``,
					        ``description`` and ``thumbnail``.
					        """
					        # NOTE(review): assumes ``url`` already matches _VALID_URL; a
					        # non-matching URL makes ``mobj`` None and the next line fail.
					        mobj = re.match(self._VALID_URL, url)
					        video_id = mobj.group(1).split('-')[0]
					        webpage = self._download_webpage(url, video_id)

					        final_url = self._search_regex(
					            r'so\.addVariable\("videoURL", "(.+?)"\)\;',
					            webpage, 'video url')
					        title = self._search_regex(
					            r'<meta content="(.+?)" property="og:title" />',
					            webpage, 'video title')
					        description = self._search_regex(
					            r'<meta name="description" content="(.+?)" />',
					            webpage, 'video description')
					        thumbnail = self._search_regex(
					            r'so\.addVariable\("thumbnailURL", "(.+?)"\)\;',
					            webpage, 'thumbnail url')

					        # Ignore any query string or fragment when deriving the extension,
					        # so "video.mp4?token=a.b" yields "mp4" rather than "b".
					        media_path = final_url.split('#')[0].split('?')[0]
					        ext = media_path.split('.')[-1]

					        return {
					            'id': video_id,
					            'url': final_url,
					            'title': title,
					            'ext': ext,
					            'description': description,
					            'thumbnail': thumbnail,
					        }
 | 
				
			||||||
		Reference in New Issue
	
	Block a user