[buzzfeed] Add new extractor (Fixes #4259)
This commit is contained in:
		@@ -38,6 +38,7 @@ from .bpb import BpbIE
 | 
			
		||||
from .br import BRIE
 | 
			
		||||
from .breakcom import BreakIE
 | 
			
		||||
from .brightcove import BrightcoveIE
 | 
			
		||||
from .buzzfeed import BuzzFeedIE
 | 
			
		||||
from .byutv import BYUtvIE
 | 
			
		||||
from .c56 import C56IE
 | 
			
		||||
from .canal13cl import Canal13clIE
 | 
			
		||||
 
 | 
			
		||||
							
								
								
									
										52
									
								
								youtube_dl/extractor/buzzfeed.py
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										52
									
								
								youtube_dl/extractor/buzzfeed.py
									
									
									
									
									
										Normal file
									
								
							@@ -0,0 +1,52 @@
 | 
			
		||||
# coding: utf-8
 | 
			
		||||
from __future__ import unicode_literals
 | 
			
		||||
 | 
			
		||||
import json
 | 
			
		||||
import re
 | 
			
		||||
 | 
			
		||||
from .common import InfoExtractor
 | 
			
		||||
 | 
			
		||||
 | 
			
		||||
class BuzzFeedIE(InfoExtractor):
 | 
			
		||||
    _VALID_URL = r'https?://(?:www\.)?buzzfeed\.com/[^?#]*?/(?P<id>[^?#]+)'
 | 
			
		||||
    _TEST = {
 | 
			
		||||
        'url': 'http://www.buzzfeed.com/abagg/this-angry-ram-destroys-a-punching-bag-like-a-boss?utm_term=4ldqpia',
 | 
			
		||||
        'info_dict': {
 | 
			
		||||
            'id': 'this-angry-ram-destroys-a-punching-bag-like-a-boss',
 | 
			
		||||
            'title': 'This Angry Ram Destroys A Punching Bag Like A Boss',
 | 
			
		||||
            'description': 'Rambro!',
 | 
			
		||||
        },
 | 
			
		||||
        'playlist': [{
 | 
			
		||||
            'info_dict': {
 | 
			
		||||
                'id': 'aVCR29aE_OQ',
 | 
			
		||||
                'ext': 'mp4',
 | 
			
		||||
                'upload_date': '20141024',
 | 
			
		||||
                'uploader_id': 'Buddhanz1',
 | 
			
		||||
                'description': 'He likes to stay in shape with his heavy bag, he wont stop until its on the ground\n\nFollow Angry Ram on Facebook for regular updates -\nhttps://www.facebook.com/pages/Angry-Ram/1436897249899558?ref=hl',
 | 
			
		||||
                'uploader': 'Buddhanz',
 | 
			
		||||
                'title': 'Angry Ram destroys a punching bag',
 | 
			
		||||
            }
 | 
			
		||||
        }]
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    def _real_extract(self, url):
 | 
			
		||||
        playlist_id = self._match_id(url)
 | 
			
		||||
        webpage = self._download_webpage(url, playlist_id)
 | 
			
		||||
 | 
			
		||||
        all_buckets = re.findall(
 | 
			
		||||
            r'<div class="video-embed-videopost[^"]*".*?rel:bf_bucket_data=\'([^\']+)\'',
 | 
			
		||||
            webpage)
 | 
			
		||||
        entries = []
 | 
			
		||||
        for bd_json in all_buckets:
 | 
			
		||||
            bd = json.loads(bd_json)
 | 
			
		||||
            if 'video' not in bd:
 | 
			
		||||
                continue
 | 
			
		||||
            entries.append(self.url_result(bd['video']['url']))
 | 
			
		||||
 | 
			
		||||
        return {
 | 
			
		||||
            '_type': 'playlist',
 | 
			
		||||
            'id': playlist_id,
 | 
			
		||||
            'title': self._og_search_title(webpage),
 | 
			
		||||
            'description': self._og_search_description(webpage),
 | 
			
		||||
            'entries': entries,
 | 
			
		||||
        }
 | 
			
		||||
		Reference in New Issue
	
	Block a user